]> git.ipfire.org Git - thirdparty/binutils-gdb.git/blob - gas/config/tc-i386.c
d7d45de76e0f7af5bb61fbde10292cdce29a4db3
[thirdparty/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64 WAIT_PREFIX must be the first prefix since FWAIT is really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax. Use a non-ascii letter since since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* This struct describes rounding control and SAE in the instruction. */
214 struct RC_Operation
215 {
216 enum rc_type
217 {
218 rne = 0,
219 rd,
220 ru,
221 rz,
222 saeonly
223 } type;
224 int operand;
225 };
226
227 static struct RC_Operation rc_op;
228
229 /* The struct describes masking, applied to OPERAND in the instruction.
230 MASK is a pointer to the corresponding mask register. ZEROING tells
231 whether merging or zeroing mask is used. */
232 struct Mask_Operation
233 {
234 const reg_entry *mask;
235 unsigned int zeroing;
236 /* The operand where this operation is associated. */
237 int operand;
238 };
239
240 static struct Mask_Operation mask_op;
241
242 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
243 broadcast factor. */
244 struct Broadcast_Operation
245 {
246 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
247 int type;
248
249 /* Index of broadcasted operand. */
250 int operand;
251
252 /* Number of bytes to broadcast. */
253 int bytes;
254 };
255
256 static struct Broadcast_Operation broadcast_op;
257
258 /* VEX prefix. */
259 typedef struct
260 {
261 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
262 unsigned char bytes[4];
263 unsigned int length;
264 /* Destination or source register specifier. */
265 const reg_entry *register_specifier;
266 } vex_prefix;
267
268 /* 'md_assemble ()' gathers together information and puts it into a
269 i386_insn. */
270
271 union i386_op
272 {
273 expressionS *disps;
274 expressionS *imms;
275 const reg_entry *regs;
276 };
277
278 enum i386_error
279 {
280 operand_size_mismatch,
281 operand_type_mismatch,
282 register_type_mismatch,
283 number_of_operands_mismatch,
284 invalid_instruction_suffix,
285 bad_imm4,
286 unsupported_with_intel_mnemonic,
287 unsupported_syntax,
288 unsupported,
289 invalid_vsib_address,
290 invalid_vector_register_set,
291 unsupported_vector_index_register,
292 unsupported_broadcast,
293 broadcast_needed,
294 unsupported_masking,
295 mask_not_on_destination,
296 no_default_mask,
297 unsupported_rc_sae,
298 rc_sae_operand_not_last_imm,
299 invalid_register_operand,
300 };
301
302 struct _i386_insn
303 {
304 /* TM holds the template for the insn were currently assembling. */
305 insn_template tm;
306
307 /* SUFFIX holds the instruction size suffix for byte, word, dword
308 or qword, if given. */
309 char suffix;
310
311 /* OPERANDS gives the number of given operands. */
312 unsigned int operands;
313
314 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
315 of given register, displacement, memory operands and immediate
316 operands. */
317 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
318
319 /* TYPES [i] is the type (see above #defines) which tells us how to
320 use OP[i] for the corresponding operand. */
321 i386_operand_type types[MAX_OPERANDS];
322
323 /* Displacement expression, immediate expression, or register for each
324 operand. */
325 union i386_op op[MAX_OPERANDS];
326
327 /* Flags for operands. */
328 unsigned int flags[MAX_OPERANDS];
329 #define Operand_PCrel 1
330 #define Operand_Mem 2
331
332 /* Relocation type for operand */
333 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
334
335 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
336 the base index byte below. */
337 const reg_entry *base_reg;
338 const reg_entry *index_reg;
339 unsigned int log2_scale_factor;
340
341 /* SEG gives the seg_entries of this insn. They are zero unless
342 explicit segment overrides are given. */
343 const seg_entry *seg[2];
344
345 /* Copied first memory operand string, for re-checking. */
346 char *memop1_string;
347
348 /* PREFIX holds all the given prefix opcodes (usually null).
349 PREFIXES is the number of prefix opcodes. */
350 unsigned int prefixes;
351 unsigned char prefix[MAX_PREFIXES];
352
353 /* Register is in low 3 bits of opcode. */
354 bfd_boolean short_form;
355
356 /* The operand to a branch insn indicates an absolute branch. */
357 bfd_boolean jumpabsolute;
358
359 /* Has MMX register operands. */
360 bfd_boolean has_regmmx;
361
362 /* Has XMM register operands. */
363 bfd_boolean has_regxmm;
364
365 /* Has YMM register operands. */
366 bfd_boolean has_regymm;
367
368 /* Has ZMM register operands. */
369 bfd_boolean has_regzmm;
370
371 /* Has GOTPC or TLS relocation. */
372 bfd_boolean has_gotpc_tls_reloc;
373
374 /* RM and SIB are the modrm byte and the sib byte where the
375 addressing modes of this insn are encoded. */
376 modrm_byte rm;
377 rex_byte rex;
378 rex_byte vrex;
379 sib_byte sib;
380 vex_prefix vex;
381
382 /* Masking attributes. */
383 struct Mask_Operation *mask;
384
385 /* Rounding control and SAE attributes. */
386 struct RC_Operation *rounding;
387
388 /* Broadcasting attributes. */
389 struct Broadcast_Operation *broadcast;
390
391 /* Compressed disp8*N attribute. */
392 unsigned int memshift;
393
394 /* Prefer load or store in encoding. */
395 enum
396 {
397 dir_encoding_default = 0,
398 dir_encoding_load,
399 dir_encoding_store,
400 dir_encoding_swap
401 } dir_encoding;
402
403 /* Prefer 8bit or 32bit displacement in encoding. */
404 enum
405 {
406 disp_encoding_default = 0,
407 disp_encoding_8bit,
408 disp_encoding_32bit
409 } disp_encoding;
410
411 /* Prefer the REX byte in encoding. */
412 bfd_boolean rex_encoding;
413
414 /* Disable instruction size optimization. */
415 bfd_boolean no_optimize;
416
417 /* How to encode vector instructions. */
418 enum
419 {
420 vex_encoding_default = 0,
421 vex_encoding_vex,
422 vex_encoding_vex3,
423 vex_encoding_evex
424 } vec_encoding;
425
426 /* REP prefix. */
427 const char *rep_prefix;
428
429 /* HLE prefix. */
430 const char *hle_prefix;
431
432 /* Have BND prefix. */
433 const char *bnd_prefix;
434
435 /* Have NOTRACK prefix. */
436 const char *notrack_prefix;
437
438 /* Error message. */
439 enum i386_error error;
440 };
441
442 typedef struct _i386_insn i386_insn;
443
444 /* Link RC type with corresponding string, that'll be looked for in
445 asm. */
446 struct RC_name
447 {
448 enum rc_type type;
449 const char *name;
450 unsigned int len;
451 };
452
453 static const struct RC_name RC_NamesTable[] =
454 {
455 { rne, STRING_COMMA_LEN ("rn-sae") },
456 { rd, STRING_COMMA_LEN ("rd-sae") },
457 { ru, STRING_COMMA_LEN ("ru-sae") },
458 { rz, STRING_COMMA_LEN ("rz-sae") },
459 { saeonly, STRING_COMMA_LEN ("sae") },
460 };
461
462 /* List of chars besides those in app.c:symbol_chars that can start an
463 operand. Used to prevent the scrubber eating vital white-space. */
464 const char extra_symbol_chars[] = "*%-([{}"
465 #ifdef LEX_AT
466 "@"
467 #endif
468 #ifdef LEX_QM
469 "?"
470 #endif
471 ;
472
473 #if (defined (TE_I386AIX) \
474 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
475 && !defined (TE_GNU) \
476 && !defined (TE_LINUX) \
477 && !defined (TE_NACL) \
478 && !defined (TE_FreeBSD) \
479 && !defined (TE_DragonFly) \
480 && !defined (TE_NetBSD)))
481 /* This array holds the chars that always start a comment. If the
482 pre-processor is disabled, these aren't very useful. The option
483 --divide will remove '/' from this list. */
484 const char *i386_comment_chars = "#/";
485 #define SVR4_COMMENT_CHARS 1
486 #define PREFIX_SEPARATOR '\\'
487
488 #else
489 const char *i386_comment_chars = "#";
490 #define PREFIX_SEPARATOR '/'
491 #endif
492
493 /* This array holds the chars that only start a comment at the beginning of
494 a line. If the line seems to have the form '# 123 filename'
495 .line and .file directives will appear in the pre-processed output.
496 Note that input_file.c hand checks for '#' at the beginning of the
497 first line of the input file. This is because the compiler outputs
498 #NO_APP at the beginning of its output.
499 Also note that comments started like this one will always work if
500 '/' isn't otherwise defined. */
501 const char line_comment_chars[] = "#/";
502
503 const char line_separator_chars[] = ";";
504
505 /* Chars that can be used to separate mant from exp in floating point
506 nums. */
507 const char EXP_CHARS[] = "eE";
508
509 /* Chars that mean this number is a floating point constant
510 As in 0f12.456
511 or 0d1.2345e12. */
512 const char FLT_CHARS[] = "fFdDxX";
513
514 /* Tables for lexical analysis. */
515 static char mnemonic_chars[256];
516 static char register_chars[256];
517 static char operand_chars[256];
518 static char identifier_chars[256];
519 static char digit_chars[256];
520
521 /* Lexical macros. */
522 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
523 #define is_operand_char(x) (operand_chars[(unsigned char) x])
524 #define is_register_char(x) (register_chars[(unsigned char) x])
525 #define is_space_char(x) ((x) == ' ')
526 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
527 #define is_digit_char(x) (digit_chars[(unsigned char) x])
528
529 /* All non-digit non-letter characters that may occur in an operand. */
530 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
531
532 /* md_assemble() always leaves the strings it's passed unaltered. To
533 effect this we maintain a stack of saved characters that we've smashed
534 with '\0's (indicating end of strings for various sub-fields of the
535 assembler instruction). */
536 static char save_stack[32];
537 static char *save_stack_p;
538 #define END_STRING_AND_SAVE(s) \
539 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
540 #define RESTORE_END_STRING(s) \
541 do { *(s) = *--save_stack_p; } while (0)
542
543 /* The instruction we're assembling. */
544 static i386_insn i;
545
546 /* Possible templates for current insn. */
547 static const templates *current_templates;
548
549 /* Per instruction expressionS buffers: max displacements & immediates. */
550 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
551 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
552
553 /* Current operand we are working on. */
554 static int this_operand = -1;
555
556 /* We support four different modes. FLAG_CODE variable is used to distinguish
557 these. */
558
559 enum flag_code {
560 CODE_32BIT,
561 CODE_16BIT,
562 CODE_64BIT };
563
564 static enum flag_code flag_code;
565 static unsigned int object_64bit;
566 static unsigned int disallow_64bit_reloc;
567 static int use_rela_relocations = 0;
568 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
569 static const char *tls_get_addr;
570
571 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
572 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
573 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
574
575 /* The ELF ABI to use. */
576 enum x86_elf_abi
577 {
578 I386_ABI,
579 X86_64_ABI,
580 X86_64_X32_ABI
581 };
582
583 static enum x86_elf_abi x86_elf_abi = I386_ABI;
584 #endif
585
586 #if defined (TE_PE) || defined (TE_PEP)
587 /* Use big object file format. */
588 static int use_big_obj = 0;
589 #endif
590
591 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
592 /* 1 if generating code for a shared library. */
593 static int shared = 0;
594 #endif
595
596 /* 1 for intel syntax,
597 0 if att syntax. */
598 static int intel_syntax = 0;
599
600 static enum x86_64_isa
601 {
602 amd64 = 1, /* AMD64 ISA. */
603 intel64 /* Intel64 ISA. */
604 } isa64;
605
606 /* 1 for intel mnemonic,
607 0 if att mnemonic. */
608 static int intel_mnemonic = !SYSV386_COMPAT;
609
610 /* 1 if pseudo registers are permitted. */
611 static int allow_pseudo_reg = 0;
612
613 /* 1 if register prefix % not required. */
614 static int allow_naked_reg = 0;
615
616 /* 1 if the assembler should add BND prefix for all control-transferring
617 instructions supporting it, even if this prefix wasn't specified
618 explicitly. */
619 static int add_bnd_prefix = 0;
620
621 /* 1 if pseudo index register, eiz/riz, is allowed . */
622 static int allow_index_reg = 0;
623
624 /* 1 if the assembler should ignore LOCK prefix, even if it was
625 specified explicitly. */
626 static int omit_lock_prefix = 0;
627
628 /* 1 if the assembler should encode lfence, mfence, and sfence as
629 "lock addl $0, (%{re}sp)". */
630 static int avoid_fence = 0;
631
632 /* Type of the previous instruction. */
633 static struct
634 {
635 segT seg;
636 const char *file;
637 const char *name;
638 unsigned int line;
639 enum last_insn_kind
640 {
641 last_insn_other = 0,
642 last_insn_directive,
643 last_insn_prefix
644 } kind;
645 } last_insn;
646
647 /* 1 if the assembler should generate relax relocations. */
648
649 static int generate_relax_relocations
650 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
651
652 static enum check_kind
653 {
654 check_none = 0,
655 check_warning,
656 check_error
657 }
658 sse_check, operand_check = check_warning;
659
660 /* Non-zero if branches should be aligned within power of 2 boundary. */
661 static int align_branch_power = 0;
662
663 /* Types of branches to align. */
664 enum align_branch_kind
665 {
666 align_branch_none = 0,
667 align_branch_jcc = 1,
668 align_branch_fused = 2,
669 align_branch_jmp = 3,
670 align_branch_call = 4,
671 align_branch_indirect = 5,
672 align_branch_ret = 6
673 };
674
675 /* Type bits of branches to align. */
676 enum align_branch_bit
677 {
678 align_branch_jcc_bit = 1 << align_branch_jcc,
679 align_branch_fused_bit = 1 << align_branch_fused,
680 align_branch_jmp_bit = 1 << align_branch_jmp,
681 align_branch_call_bit = 1 << align_branch_call,
682 align_branch_indirect_bit = 1 << align_branch_indirect,
683 align_branch_ret_bit = 1 << align_branch_ret
684 };
685
686 static unsigned int align_branch = (align_branch_jcc_bit
687 | align_branch_fused_bit
688 | align_branch_jmp_bit);
689
690 /* The maximum padding size for fused jcc. CMP like instruction can
691 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
692 prefixes. */
693 #define MAX_FUSED_JCC_PADDING_SIZE 20
694
695 /* The maximum number of prefixes added for an instruction. */
696 static unsigned int align_branch_prefix_size = 5;
697
698 /* Optimization:
699 1. Clear the REX_W bit with register operand if possible.
700 2. Above plus use 128bit vector instruction to clear the full vector
701 register.
702 */
703 static int optimize = 0;
704
705 /* Optimization:
706 1. Clear the REX_W bit with register operand if possible.
707 2. Above plus use 128bit vector instruction to clear the full vector
708 register.
709 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
710 "testb $imm7,%r8".
711 */
712 static int optimize_for_space = 0;
713
714 /* Register prefix used for error message. */
715 static const char *register_prefix = "%";
716
717 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
718 leave, push, and pop instructions so that gcc has the same stack
719 frame as in 32 bit mode. */
720 static char stackop_size = '\0';
721
722 /* Non-zero to optimize code alignment. */
723 int optimize_align_code = 1;
724
725 /* Non-zero to quieten some warnings. */
726 static int quiet_warnings = 0;
727
728 /* CPU name. */
729 static const char *cpu_arch_name = NULL;
730 static char *cpu_sub_arch_name = NULL;
731
732 /* CPU feature flags. */
733 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
734
735 /* If we have selected a cpu we are generating instructions for. */
736 static int cpu_arch_tune_set = 0;
737
738 /* Cpu we are generating instructions for. */
739 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
740
741 /* CPU feature flags of cpu we are generating instructions for. */
742 static i386_cpu_flags cpu_arch_tune_flags;
743
744 /* CPU instruction set architecture used. */
745 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
746
747 /* CPU feature flags of instruction set architecture used. */
748 i386_cpu_flags cpu_arch_isa_flags;
749
750 /* If set, conditional jumps are not automatically promoted to handle
751 larger than a byte offset. */
752 static unsigned int no_cond_jump_promotion = 0;
753
754 /* Encode SSE instructions with VEX prefix. */
755 static unsigned int sse2avx;
756
757 /* Encode scalar AVX instructions with specific vector length. */
758 static enum
759 {
760 vex128 = 0,
761 vex256
762 } avxscalar;
763
764 /* Encode VEX WIG instructions with specific vex.w. */
765 static enum
766 {
767 vexw0 = 0,
768 vexw1
769 } vexwig;
770
771 /* Encode scalar EVEX LIG instructions with specific vector length. */
772 static enum
773 {
774 evexl128 = 0,
775 evexl256,
776 evexl512
777 } evexlig;
778
779 /* Encode EVEX WIG instructions with specific evex.w. */
780 static enum
781 {
782 evexw0 = 0,
783 evexw1
784 } evexwig;
785
786 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
787 static enum rc_type evexrcig = rne;
788
789 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
790 static symbolS *GOT_symbol;
791
792 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
793 unsigned int x86_dwarf2_return_column;
794
795 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
796 int x86_cie_data_alignment;
797
798 /* Interface to relax_segment.
799 There are 3 major relax states for 386 jump insns because the
800 different types of jumps add different sizes to frags when we're
801 figuring out what sort of jump to choose to reach a given label.
802
803 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
804 branches which are handled by md_estimate_size_before_relax() and
805 i386_generic_table_relax_frag(). */
806
807 /* Types. */
808 #define UNCOND_JUMP 0
809 #define COND_JUMP 1
810 #define COND_JUMP86 2
811 #define BRANCH_PADDING 3
812 #define BRANCH_PREFIX 4
813 #define FUSED_JCC_PADDING 5
814
815 /* Sizes. */
816 #define CODE16 1
817 #define SMALL 0
818 #define SMALL16 (SMALL | CODE16)
819 #define BIG 2
820 #define BIG16 (BIG | CODE16)
821
822 #ifndef INLINE
823 #ifdef __GNUC__
824 #define INLINE __inline__
825 #else
826 #define INLINE
827 #endif
828 #endif
829
830 #define ENCODE_RELAX_STATE(type, size) \
831 ((relax_substateT) (((type) << 2) | (size)))
832 #define TYPE_FROM_RELAX_STATE(s) \
833 ((s) >> 2)
834 #define DISP_SIZE_FROM_RELAX_STATE(s) \
835 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
836
837 /* This table is used by relax_frag to promote short jumps to long
838 ones where necessary. SMALL (short) jumps may be promoted to BIG
839 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
840 don't allow a short jump in a 32 bit code segment to be promoted to
841 a 16 bit offset jump because it's slower (requires data size
842 prefix), and doesn't work, unless the destination is in the bottom
843 64k of the code segment (The top 16 bits of eip are zeroed). */
844
845 const relax_typeS md_relax_table[] =
846 {
847 /* The fields are:
848 1) most positive reach of this state,
849 2) most negative reach of this state,
850 3) how many bytes this mode will have in the variable part of the frag
851 4) which index into the table to try if we can't fit into this one. */
852
853 /* UNCOND_JUMP states. */
854 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
855 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
856 /* dword jmp adds 4 bytes to frag:
857 0 extra opcode bytes, 4 displacement bytes. */
858 {0, 0, 4, 0},
859 /* word jmp adds 2 byte2 to frag:
860 0 extra opcode bytes, 2 displacement bytes. */
861 {0, 0, 2, 0},
862
863 /* COND_JUMP states. */
864 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
865 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
866 /* dword conditionals adds 5 bytes to frag:
867 1 extra opcode byte, 4 displacement bytes. */
868 {0, 0, 5, 0},
869 /* word conditionals add 3 bytes to frag:
870 1 extra opcode byte, 2 displacement bytes. */
871 {0, 0, 3, 0},
872
873 /* COND_JUMP86 states. */
874 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
875 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
876 /* dword conditionals adds 5 bytes to frag:
877 1 extra opcode byte, 4 displacement bytes. */
878 {0, 0, 5, 0},
879 /* word conditionals add 4 bytes to frag:
880 1 displacement byte and a 3 byte long branch insn. */
881 {0, 0, 4, 0}
882 };
883
884 static const arch_entry cpu_arch[] =
885 {
886 /* Do not replace the first two entries - i386_target_format()
887 relies on them being there in this order. */
888 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
889 CPU_GENERIC32_FLAGS, 0 },
890 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
891 CPU_GENERIC64_FLAGS, 0 },
892 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
893 CPU_NONE_FLAGS, 0 },
894 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
895 CPU_I186_FLAGS, 0 },
896 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
897 CPU_I286_FLAGS, 0 },
898 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
899 CPU_I386_FLAGS, 0 },
900 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
901 CPU_I486_FLAGS, 0 },
902 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
903 CPU_I586_FLAGS, 0 },
904 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
905 CPU_I686_FLAGS, 0 },
906 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
907 CPU_I586_FLAGS, 0 },
908 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
909 CPU_PENTIUMPRO_FLAGS, 0 },
910 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
911 CPU_P2_FLAGS, 0 },
912 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
913 CPU_P3_FLAGS, 0 },
914 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
915 CPU_P4_FLAGS, 0 },
916 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
917 CPU_CORE_FLAGS, 0 },
918 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
919 CPU_NOCONA_FLAGS, 0 },
920 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
921 CPU_CORE_FLAGS, 1 },
922 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
923 CPU_CORE_FLAGS, 0 },
924 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
925 CPU_CORE2_FLAGS, 1 },
926 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
927 CPU_CORE2_FLAGS, 0 },
928 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
929 CPU_COREI7_FLAGS, 0 },
930 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
931 CPU_L1OM_FLAGS, 0 },
932 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
933 CPU_K1OM_FLAGS, 0 },
934 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
935 CPU_IAMCU_FLAGS, 0 },
936 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
937 CPU_K6_FLAGS, 0 },
938 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
939 CPU_K6_2_FLAGS, 0 },
940 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
941 CPU_ATHLON_FLAGS, 0 },
942 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
943 CPU_K8_FLAGS, 1 },
944 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
945 CPU_K8_FLAGS, 0 },
946 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
947 CPU_K8_FLAGS, 0 },
948 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
949 CPU_AMDFAM10_FLAGS, 0 },
950 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
951 CPU_BDVER1_FLAGS, 0 },
952 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
953 CPU_BDVER2_FLAGS, 0 },
954 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
955 CPU_BDVER3_FLAGS, 0 },
956 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
957 CPU_BDVER4_FLAGS, 0 },
958 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
959 CPU_ZNVER1_FLAGS, 0 },
960 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
961 CPU_ZNVER2_FLAGS, 0 },
962 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
963 CPU_BTVER1_FLAGS, 0 },
964 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
965 CPU_BTVER2_FLAGS, 0 },
966 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
967 CPU_8087_FLAGS, 0 },
968 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
969 CPU_287_FLAGS, 0 },
970 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
971 CPU_387_FLAGS, 0 },
972 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
973 CPU_687_FLAGS, 0 },
974 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
975 CPU_CMOV_FLAGS, 0 },
976 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
977 CPU_FXSR_FLAGS, 0 },
978 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
979 CPU_MMX_FLAGS, 0 },
980 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
981 CPU_SSE_FLAGS, 0 },
982 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
983 CPU_SSE2_FLAGS, 0 },
984 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
985 CPU_SSE3_FLAGS, 0 },
986 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
987 CPU_SSSE3_FLAGS, 0 },
988 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
989 CPU_SSE4_1_FLAGS, 0 },
990 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
991 CPU_SSE4_2_FLAGS, 0 },
992 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
993 CPU_SSE4_2_FLAGS, 0 },
994 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
995 CPU_AVX_FLAGS, 0 },
996 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
997 CPU_AVX2_FLAGS, 0 },
998 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
999 CPU_AVX512F_FLAGS, 0 },
1000 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1001 CPU_AVX512CD_FLAGS, 0 },
1002 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1003 CPU_AVX512ER_FLAGS, 0 },
1004 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1005 CPU_AVX512PF_FLAGS, 0 },
1006 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1007 CPU_AVX512DQ_FLAGS, 0 },
1008 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1009 CPU_AVX512BW_FLAGS, 0 },
1010 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1011 CPU_AVX512VL_FLAGS, 0 },
1012 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1013 CPU_VMX_FLAGS, 0 },
1014 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1015 CPU_VMFUNC_FLAGS, 0 },
1016 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1017 CPU_SMX_FLAGS, 0 },
1018 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1019 CPU_XSAVE_FLAGS, 0 },
1020 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1021 CPU_XSAVEOPT_FLAGS, 0 },
1022 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1023 CPU_XSAVEC_FLAGS, 0 },
1024 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1025 CPU_XSAVES_FLAGS, 0 },
1026 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1027 CPU_AES_FLAGS, 0 },
1028 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1029 CPU_PCLMUL_FLAGS, 0 },
1030 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1031 CPU_PCLMUL_FLAGS, 1 },
1032 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1033 CPU_FSGSBASE_FLAGS, 0 },
1034 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1035 CPU_RDRND_FLAGS, 0 },
1036 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1037 CPU_F16C_FLAGS, 0 },
1038 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1039 CPU_BMI2_FLAGS, 0 },
1040 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1041 CPU_FMA_FLAGS, 0 },
1042 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1043 CPU_FMA4_FLAGS, 0 },
1044 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1045 CPU_XOP_FLAGS, 0 },
1046 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1047 CPU_LWP_FLAGS, 0 },
1048 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1049 CPU_MOVBE_FLAGS, 0 },
1050 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1051 CPU_CX16_FLAGS, 0 },
1052 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1053 CPU_EPT_FLAGS, 0 },
1054 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1055 CPU_LZCNT_FLAGS, 0 },
1056 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1057 CPU_HLE_FLAGS, 0 },
1058 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1059 CPU_RTM_FLAGS, 0 },
1060 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1061 CPU_INVPCID_FLAGS, 0 },
1062 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1063 CPU_CLFLUSH_FLAGS, 0 },
1064 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1065 CPU_NOP_FLAGS, 0 },
1066 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1067 CPU_SYSCALL_FLAGS, 0 },
1068 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1069 CPU_RDTSCP_FLAGS, 0 },
1070 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1071 CPU_3DNOW_FLAGS, 0 },
1072 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1073 CPU_3DNOWA_FLAGS, 0 },
1074 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1075 CPU_PADLOCK_FLAGS, 0 },
1076 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1077 CPU_SVME_FLAGS, 1 },
1078 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1079 CPU_SVME_FLAGS, 0 },
1080 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1081 CPU_SSE4A_FLAGS, 0 },
1082 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1083 CPU_ABM_FLAGS, 0 },
1084 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1085 CPU_BMI_FLAGS, 0 },
1086 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1087 CPU_TBM_FLAGS, 0 },
1088 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1089 CPU_ADX_FLAGS, 0 },
1090 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1091 CPU_RDSEED_FLAGS, 0 },
1092 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1093 CPU_PRFCHW_FLAGS, 0 },
1094 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1095 CPU_SMAP_FLAGS, 0 },
1096 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1097 CPU_MPX_FLAGS, 0 },
1098 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1099 CPU_SHA_FLAGS, 0 },
1100 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1101 CPU_CLFLUSHOPT_FLAGS, 0 },
1102 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1103 CPU_PREFETCHWT1_FLAGS, 0 },
1104 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1105 CPU_SE1_FLAGS, 0 },
1106 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1107 CPU_CLWB_FLAGS, 0 },
1108 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1109 CPU_AVX512IFMA_FLAGS, 0 },
1110 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1111 CPU_AVX512VBMI_FLAGS, 0 },
1112 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1113 CPU_AVX512_4FMAPS_FLAGS, 0 },
1114 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1115 CPU_AVX512_4VNNIW_FLAGS, 0 },
1116 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1117 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1118 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1119 CPU_AVX512_VBMI2_FLAGS, 0 },
1120 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1121 CPU_AVX512_VNNI_FLAGS, 0 },
1122 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1123 CPU_AVX512_BITALG_FLAGS, 0 },
1124 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1125 CPU_CLZERO_FLAGS, 0 },
1126 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1127 CPU_MWAITX_FLAGS, 0 },
1128 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1129 CPU_OSPKE_FLAGS, 0 },
1130 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1131 CPU_RDPID_FLAGS, 0 },
1132 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1133 CPU_PTWRITE_FLAGS, 0 },
1134 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1135 CPU_IBT_FLAGS, 0 },
1136 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1137 CPU_SHSTK_FLAGS, 0 },
1138 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1139 CPU_GFNI_FLAGS, 0 },
1140 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1141 CPU_VAES_FLAGS, 0 },
1142 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1143 CPU_VPCLMULQDQ_FLAGS, 0 },
1144 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1145 CPU_WBNOINVD_FLAGS, 0 },
1146 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1147 CPU_PCONFIG_FLAGS, 0 },
1148 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1149 CPU_WAITPKG_FLAGS, 0 },
1150 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1151 CPU_CLDEMOTE_FLAGS, 0 },
1152 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1153 CPU_MOVDIRI_FLAGS, 0 },
1154 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1155 CPU_MOVDIR64B_FLAGS, 0 },
1156 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1157 CPU_AVX512_BF16_FLAGS, 0 },
1158 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1159 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1160 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1161 CPU_ENQCMD_FLAGS, 0 },
1162 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1163 CPU_RDPRU_FLAGS, 0 },
1164 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1165 CPU_MCOMMIT_FLAGS, 0 },
1166 };
1167
1168 static const noarch_entry cpu_noarch[] =
1169 {
1170 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1171 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1172 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1173 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1174 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1175 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1176 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1177 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1178 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1179 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1180 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1181 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1182 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1183 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_FLAGS },
1184 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1185 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1186 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1187 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1188 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1189 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1190 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1191 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1192 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1193 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1194 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1195 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1196 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1197 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1198 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1199 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1200 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1201 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1202 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1203 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1204 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1205 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1206 { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1207 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1208 };
1209
1210 #ifdef I386COFF
1211 /* Like s_lcomm_internal in gas/read.c but the alignment string
1212 is allowed to be optional. */
1213
1214 static symbolS *
1215 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1216 {
1217 addressT align = 0;
1218
1219 SKIP_WHITESPACE ();
1220
1221 if (needs_align
1222 && *input_line_pointer == ',')
1223 {
1224 align = parse_align (needs_align - 1);
1225
1226 if (align == (addressT) -1)
1227 return NULL;
1228 }
1229 else
1230 {
1231 if (size >= 8)
1232 align = 3;
1233 else if (size >= 4)
1234 align = 2;
1235 else if (size >= 2)
1236 align = 1;
1237 else
1238 align = 0;
1239 }
1240
1241 bss_alloc (symbolP, size, align);
1242 return symbolP;
1243 }
1244
1245 static void
1246 pe_lcomm (int needs_align)
1247 {
1248 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1249 }
1250 #endif
1251
1252 const pseudo_typeS md_pseudo_table[] =
1253 {
1254 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1255 {"align", s_align_bytes, 0},
1256 #else
1257 {"align", s_align_ptwo, 0},
1258 #endif
1259 {"arch", set_cpu_arch, 0},
1260 #ifndef I386COFF
1261 {"bss", s_bss, 0},
1262 #else
1263 {"lcomm", pe_lcomm, 1},
1264 #endif
1265 {"ffloat", float_cons, 'f'},
1266 {"dfloat", float_cons, 'd'},
1267 {"tfloat", float_cons, 'x'},
1268 {"value", cons, 2},
1269 {"slong", signed_cons, 4},
1270 {"noopt", s_ignore, 0},
1271 {"optim", s_ignore, 0},
1272 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1273 {"code16", set_code_flag, CODE_16BIT},
1274 {"code32", set_code_flag, CODE_32BIT},
1275 #ifdef BFD64
1276 {"code64", set_code_flag, CODE_64BIT},
1277 #endif
1278 {"intel_syntax", set_intel_syntax, 1},
1279 {"att_syntax", set_intel_syntax, 0},
1280 {"intel_mnemonic", set_intel_mnemonic, 1},
1281 {"att_mnemonic", set_intel_mnemonic, 0},
1282 {"allow_index_reg", set_allow_index_reg, 1},
1283 {"disallow_index_reg", set_allow_index_reg, 0},
1284 {"sse_check", set_check, 0},
1285 {"operand_check", set_check, 1},
1286 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1287 {"largecomm", handle_large_common, 0},
1288 #else
1289 {"file", dwarf2_directive_file, 0},
1290 {"loc", dwarf2_directive_loc, 0},
1291 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1292 #endif
1293 #ifdef TE_PE
1294 {"secrel32", pe_directive_secrel, 0},
1295 #endif
1296 {0, 0, 0}
1297 };
1298
1299 /* For interface with expression (). */
1300 extern char *input_line_pointer;
1301
1302 /* Hash table for instruction mnemonic lookup. */
1303 static struct hash_control *op_hash;
1304
1305 /* Hash table for register lookup. */
1306 static struct hash_control *reg_hash;
1307 \f
1308 /* Various efficient no-op patterns for aligning code labels.
1309 Note: Don't try to assemble the instructions in the comments.
1310 0L and 0w are not legal. */
1311 static const unsigned char f32_1[] =
1312 {0x90}; /* nop */
1313 static const unsigned char f32_2[] =
1314 {0x66,0x90}; /* xchg %ax,%ax */
1315 static const unsigned char f32_3[] =
1316 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1317 static const unsigned char f32_4[] =
1318 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1319 static const unsigned char f32_6[] =
1320 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1321 static const unsigned char f32_7[] =
1322 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1323 static const unsigned char f16_3[] =
1324 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1325 static const unsigned char f16_4[] =
1326 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1327 static const unsigned char jump_disp8[] =
1328 {0xeb}; /* jmp disp8 */
1329 static const unsigned char jump32_disp32[] =
1330 {0xe9}; /* jmp disp32 */
1331 static const unsigned char jump16_disp32[] =
1332 {0x66,0xe9}; /* jmp disp32 */
1333 /* 32-bit NOPs patterns. */
1334 static const unsigned char *const f32_patt[] = {
1335 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1336 };
1337 /* 16-bit NOPs patterns. */
1338 static const unsigned char *const f16_patt[] = {
1339 f32_1, f32_2, f16_3, f16_4
1340 };
1341 /* nopl (%[re]ax) */
1342 static const unsigned char alt_3[] =
1343 {0x0f,0x1f,0x00};
1344 /* nopl 0(%[re]ax) */
1345 static const unsigned char alt_4[] =
1346 {0x0f,0x1f,0x40,0x00};
1347 /* nopl 0(%[re]ax,%[re]ax,1) */
1348 static const unsigned char alt_5[] =
1349 {0x0f,0x1f,0x44,0x00,0x00};
1350 /* nopw 0(%[re]ax,%[re]ax,1) */
1351 static const unsigned char alt_6[] =
1352 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1353 /* nopl 0L(%[re]ax) */
1354 static const unsigned char alt_7[] =
1355 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1356 /* nopl 0L(%[re]ax,%[re]ax,1) */
1357 static const unsigned char alt_8[] =
1358 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1359 /* nopw 0L(%[re]ax,%[re]ax,1) */
1360 static const unsigned char alt_9[] =
1361 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1362 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1363 static const unsigned char alt_10[] =
1364 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1365 /* data16 nopw %cs:0L(%eax,%eax,1) */
1366 static const unsigned char alt_11[] =
1367 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1368 /* 32-bit and 64-bit NOPs patterns. */
1369 static const unsigned char *const alt_patt[] = {
1370 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1371 alt_9, alt_10, alt_11
1372 };
1373
1374 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1375 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1376
1377 static void
1378 i386_output_nops (char *where, const unsigned char *const *patt,
1379 int count, int max_single_nop_size)
1380
1381 {
1382 /* Place the longer NOP first. */
1383 int last;
1384 int offset;
1385 const unsigned char *nops;
1386
1387 if (max_single_nop_size < 1)
1388 {
1389 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1390 max_single_nop_size);
1391 return;
1392 }
1393
1394 nops = patt[max_single_nop_size - 1];
1395
1396 /* Use the smaller one if the requsted one isn't available. */
1397 if (nops == NULL)
1398 {
1399 max_single_nop_size--;
1400 nops = patt[max_single_nop_size - 1];
1401 }
1402
1403 last = count % max_single_nop_size;
1404
1405 count -= last;
1406 for (offset = 0; offset < count; offset += max_single_nop_size)
1407 memcpy (where + offset, nops, max_single_nop_size);
1408
1409 if (last)
1410 {
1411 nops = patt[last - 1];
1412 if (nops == NULL)
1413 {
1414 /* Use the smaller one plus one-byte NOP if the needed one
1415 isn't available. */
1416 last--;
1417 nops = patt[last - 1];
1418 memcpy (where + offset, nops, last);
1419 where[offset + last] = *patt[0];
1420 }
1421 else
1422 memcpy (where + offset, nops, last);
1423 }
1424 }
1425
1426 static INLINE int
1427 fits_in_imm7 (offsetT num)
1428 {
1429 return (num & 0x7f) == num;
1430 }
1431
1432 static INLINE int
1433 fits_in_imm31 (offsetT num)
1434 {
1435 return (num & 0x7fffffff) == num;
1436 }
1437
1438 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1439 single NOP instruction LIMIT. */
1440
1441 void
1442 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1443 {
1444 const unsigned char *const *patt = NULL;
1445 int max_single_nop_size;
1446 /* Maximum number of NOPs before switching to jump over NOPs. */
1447 int max_number_of_nops;
1448
1449 switch (fragP->fr_type)
1450 {
1451 case rs_fill_nop:
1452 case rs_align_code:
1453 break;
1454 case rs_machine_dependent:
1455 /* Allow NOP padding for jumps and calls. */
1456 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1457 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1458 break;
1459 /* Fall through. */
1460 default:
1461 return;
1462 }
1463
1464 /* We need to decide which NOP sequence to use for 32bit and
1465 64bit. When -mtune= is used:
1466
1467 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1468 PROCESSOR_GENERIC32, f32_patt will be used.
1469 2. For the rest, alt_patt will be used.
1470
1471 When -mtune= isn't used, alt_patt will be used if
1472 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1473 be used.
1474
1475 When -march= or .arch is used, we can't use anything beyond
1476 cpu_arch_isa_flags. */
1477
1478 if (flag_code == CODE_16BIT)
1479 {
1480 patt = f16_patt;
1481 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1482 /* Limit number of NOPs to 2 in 16-bit mode. */
1483 max_number_of_nops = 2;
1484 }
1485 else
1486 {
1487 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1488 {
1489 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1490 switch (cpu_arch_tune)
1491 {
1492 case PROCESSOR_UNKNOWN:
1493 /* We use cpu_arch_isa_flags to check if we SHOULD
1494 optimize with nops. */
1495 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1496 patt = alt_patt;
1497 else
1498 patt = f32_patt;
1499 break;
1500 case PROCESSOR_PENTIUM4:
1501 case PROCESSOR_NOCONA:
1502 case PROCESSOR_CORE:
1503 case PROCESSOR_CORE2:
1504 case PROCESSOR_COREI7:
1505 case PROCESSOR_L1OM:
1506 case PROCESSOR_K1OM:
1507 case PROCESSOR_GENERIC64:
1508 case PROCESSOR_K6:
1509 case PROCESSOR_ATHLON:
1510 case PROCESSOR_K8:
1511 case PROCESSOR_AMDFAM10:
1512 case PROCESSOR_BD:
1513 case PROCESSOR_ZNVER:
1514 case PROCESSOR_BT:
1515 patt = alt_patt;
1516 break;
1517 case PROCESSOR_I386:
1518 case PROCESSOR_I486:
1519 case PROCESSOR_PENTIUM:
1520 case PROCESSOR_PENTIUMPRO:
1521 case PROCESSOR_IAMCU:
1522 case PROCESSOR_GENERIC32:
1523 patt = f32_patt;
1524 break;
1525 }
1526 }
1527 else
1528 {
1529 switch (fragP->tc_frag_data.tune)
1530 {
1531 case PROCESSOR_UNKNOWN:
1532 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1533 PROCESSOR_UNKNOWN. */
1534 abort ();
1535 break;
1536
1537 case PROCESSOR_I386:
1538 case PROCESSOR_I486:
1539 case PROCESSOR_PENTIUM:
1540 case PROCESSOR_IAMCU:
1541 case PROCESSOR_K6:
1542 case PROCESSOR_ATHLON:
1543 case PROCESSOR_K8:
1544 case PROCESSOR_AMDFAM10:
1545 case PROCESSOR_BD:
1546 case PROCESSOR_ZNVER:
1547 case PROCESSOR_BT:
1548 case PROCESSOR_GENERIC32:
1549 /* We use cpu_arch_isa_flags to check if we CAN optimize
1550 with nops. */
1551 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1552 patt = alt_patt;
1553 else
1554 patt = f32_patt;
1555 break;
1556 case PROCESSOR_PENTIUMPRO:
1557 case PROCESSOR_PENTIUM4:
1558 case PROCESSOR_NOCONA:
1559 case PROCESSOR_CORE:
1560 case PROCESSOR_CORE2:
1561 case PROCESSOR_COREI7:
1562 case PROCESSOR_L1OM:
1563 case PROCESSOR_K1OM:
1564 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1565 patt = alt_patt;
1566 else
1567 patt = f32_patt;
1568 break;
1569 case PROCESSOR_GENERIC64:
1570 patt = alt_patt;
1571 break;
1572 }
1573 }
1574
1575 if (patt == f32_patt)
1576 {
1577 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1578 /* Limit number of NOPs to 2 for older processors. */
1579 max_number_of_nops = 2;
1580 }
1581 else
1582 {
1583 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1584 /* Limit number of NOPs to 7 for newer processors. */
1585 max_number_of_nops = 7;
1586 }
1587 }
1588
1589 if (limit == 0)
1590 limit = max_single_nop_size;
1591
1592 if (fragP->fr_type == rs_fill_nop)
1593 {
1594 /* Output NOPs for .nop directive. */
1595 if (limit > max_single_nop_size)
1596 {
1597 as_bad_where (fragP->fr_file, fragP->fr_line,
1598 _("invalid single nop size: %d "
1599 "(expect within [0, %d])"),
1600 limit, max_single_nop_size);
1601 return;
1602 }
1603 }
1604 else if (fragP->fr_type != rs_machine_dependent)
1605 fragP->fr_var = count;
1606
1607 if ((count / max_single_nop_size) > max_number_of_nops)
1608 {
1609 /* Generate jump over NOPs. */
1610 offsetT disp = count - 2;
1611 if (fits_in_imm7 (disp))
1612 {
1613 /* Use "jmp disp8" if possible. */
1614 count = disp;
1615 where[0] = jump_disp8[0];
1616 where[1] = count;
1617 where += 2;
1618 }
1619 else
1620 {
1621 unsigned int size_of_jump;
1622
1623 if (flag_code == CODE_16BIT)
1624 {
1625 where[0] = jump16_disp32[0];
1626 where[1] = jump16_disp32[1];
1627 size_of_jump = 2;
1628 }
1629 else
1630 {
1631 where[0] = jump32_disp32[0];
1632 size_of_jump = 1;
1633 }
1634
1635 count -= size_of_jump + 4;
1636 if (!fits_in_imm31 (count))
1637 {
1638 as_bad_where (fragP->fr_file, fragP->fr_line,
1639 _("jump over nop padding out of range"));
1640 return;
1641 }
1642
1643 md_number_to_chars (where + size_of_jump, count, 4);
1644 where += size_of_jump + 4;
1645 }
1646 }
1647
1648 /* Generate multiple NOPs. */
1649 i386_output_nops (where, patt, count, limit);
1650 }
1651
1652 static INLINE int
1653 operand_type_all_zero (const union i386_operand_type *x)
1654 {
1655 switch (ARRAY_SIZE(x->array))
1656 {
1657 case 3:
1658 if (x->array[2])
1659 return 0;
1660 /* Fall through. */
1661 case 2:
1662 if (x->array[1])
1663 return 0;
1664 /* Fall through. */
1665 case 1:
1666 return !x->array[0];
1667 default:
1668 abort ();
1669 }
1670 }
1671
1672 static INLINE void
1673 operand_type_set (union i386_operand_type *x, unsigned int v)
1674 {
1675 switch (ARRAY_SIZE(x->array))
1676 {
1677 case 3:
1678 x->array[2] = v;
1679 /* Fall through. */
1680 case 2:
1681 x->array[1] = v;
1682 /* Fall through. */
1683 case 1:
1684 x->array[0] = v;
1685 /* Fall through. */
1686 break;
1687 default:
1688 abort ();
1689 }
1690
1691 x->bitfield.class = ClassNone;
1692 x->bitfield.instance = InstanceNone;
1693 }
1694
1695 static INLINE int
1696 operand_type_equal (const union i386_operand_type *x,
1697 const union i386_operand_type *y)
1698 {
1699 switch (ARRAY_SIZE(x->array))
1700 {
1701 case 3:
1702 if (x->array[2] != y->array[2])
1703 return 0;
1704 /* Fall through. */
1705 case 2:
1706 if (x->array[1] != y->array[1])
1707 return 0;
1708 /* Fall through. */
1709 case 1:
1710 return x->array[0] == y->array[0];
1711 break;
1712 default:
1713 abort ();
1714 }
1715 }
1716
1717 static INLINE int
1718 cpu_flags_all_zero (const union i386_cpu_flags *x)
1719 {
1720 switch (ARRAY_SIZE(x->array))
1721 {
1722 case 4:
1723 if (x->array[3])
1724 return 0;
1725 /* Fall through. */
1726 case 3:
1727 if (x->array[2])
1728 return 0;
1729 /* Fall through. */
1730 case 2:
1731 if (x->array[1])
1732 return 0;
1733 /* Fall through. */
1734 case 1:
1735 return !x->array[0];
1736 default:
1737 abort ();
1738 }
1739 }
1740
1741 static INLINE int
1742 cpu_flags_equal (const union i386_cpu_flags *x,
1743 const union i386_cpu_flags *y)
1744 {
1745 switch (ARRAY_SIZE(x->array))
1746 {
1747 case 4:
1748 if (x->array[3] != y->array[3])
1749 return 0;
1750 /* Fall through. */
1751 case 3:
1752 if (x->array[2] != y->array[2])
1753 return 0;
1754 /* Fall through. */
1755 case 2:
1756 if (x->array[1] != y->array[1])
1757 return 0;
1758 /* Fall through. */
1759 case 1:
1760 return x->array[0] == y->array[0];
1761 break;
1762 default:
1763 abort ();
1764 }
1765 }
1766
1767 static INLINE int
1768 cpu_flags_check_cpu64 (i386_cpu_flags f)
1769 {
1770 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1771 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1772 }
1773
1774 static INLINE i386_cpu_flags
1775 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1776 {
1777 switch (ARRAY_SIZE (x.array))
1778 {
1779 case 4:
1780 x.array [3] &= y.array [3];
1781 /* Fall through. */
1782 case 3:
1783 x.array [2] &= y.array [2];
1784 /* Fall through. */
1785 case 2:
1786 x.array [1] &= y.array [1];
1787 /* Fall through. */
1788 case 1:
1789 x.array [0] &= y.array [0];
1790 break;
1791 default:
1792 abort ();
1793 }
1794 return x;
1795 }
1796
1797 static INLINE i386_cpu_flags
1798 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1799 {
1800 switch (ARRAY_SIZE (x.array))
1801 {
1802 case 4:
1803 x.array [3] |= y.array [3];
1804 /* Fall through. */
1805 case 3:
1806 x.array [2] |= y.array [2];
1807 /* Fall through. */
1808 case 2:
1809 x.array [1] |= y.array [1];
1810 /* Fall through. */
1811 case 1:
1812 x.array [0] |= y.array [0];
1813 break;
1814 default:
1815 abort ();
1816 }
1817 return x;
1818 }
1819
1820 static INLINE i386_cpu_flags
1821 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1822 {
1823 switch (ARRAY_SIZE (x.array))
1824 {
1825 case 4:
1826 x.array [3] &= ~y.array [3];
1827 /* Fall through. */
1828 case 3:
1829 x.array [2] &= ~y.array [2];
1830 /* Fall through. */
1831 case 2:
1832 x.array [1] &= ~y.array [1];
1833 /* Fall through. */
1834 case 1:
1835 x.array [0] &= ~y.array [0];
1836 break;
1837 default:
1838 abort ();
1839 }
1840 return x;
1841 }
1842
1843 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1844
1845 #define CPU_FLAGS_ARCH_MATCH 0x1
1846 #define CPU_FLAGS_64BIT_MATCH 0x2
1847
1848 #define CPU_FLAGS_PERFECT_MATCH \
1849 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1850
1851 /* Return CPU flags match bits. */
1852
1853 static int
1854 cpu_flags_match (const insn_template *t)
1855 {
1856 i386_cpu_flags x = t->cpu_flags;
1857 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1858
1859 x.bitfield.cpu64 = 0;
1860 x.bitfield.cpuno64 = 0;
1861
1862 if (cpu_flags_all_zero (&x))
1863 {
1864 /* This instruction is available on all archs. */
1865 match |= CPU_FLAGS_ARCH_MATCH;
1866 }
1867 else
1868 {
1869 /* This instruction is available only on some archs. */
1870 i386_cpu_flags cpu = cpu_arch_flags;
1871
1872 /* AVX512VL is no standalone feature - match it and then strip it. */
1873 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1874 return match;
1875 x.bitfield.cpuavx512vl = 0;
1876
1877 cpu = cpu_flags_and (x, cpu);
1878 if (!cpu_flags_all_zero (&cpu))
1879 {
1880 if (x.bitfield.cpuavx)
1881 {
1882 /* We need to check a few extra flags with AVX. */
1883 if (cpu.bitfield.cpuavx
1884 && (!t->opcode_modifier.sse2avx || sse2avx)
1885 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1886 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1887 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1888 match |= CPU_FLAGS_ARCH_MATCH;
1889 }
1890 else if (x.bitfield.cpuavx512f)
1891 {
1892 /* We need to check a few extra flags with AVX512F. */
1893 if (cpu.bitfield.cpuavx512f
1894 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1895 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1896 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1897 match |= CPU_FLAGS_ARCH_MATCH;
1898 }
1899 else
1900 match |= CPU_FLAGS_ARCH_MATCH;
1901 }
1902 }
1903 return match;
1904 }
1905
1906 static INLINE i386_operand_type
1907 operand_type_and (i386_operand_type x, i386_operand_type y)
1908 {
1909 if (x.bitfield.class != y.bitfield.class)
1910 x.bitfield.class = ClassNone;
1911 if (x.bitfield.instance != y.bitfield.instance)
1912 x.bitfield.instance = InstanceNone;
1913
1914 switch (ARRAY_SIZE (x.array))
1915 {
1916 case 3:
1917 x.array [2] &= y.array [2];
1918 /* Fall through. */
1919 case 2:
1920 x.array [1] &= y.array [1];
1921 /* Fall through. */
1922 case 1:
1923 x.array [0] &= y.array [0];
1924 break;
1925 default:
1926 abort ();
1927 }
1928 return x;
1929 }
1930
1931 static INLINE i386_operand_type
1932 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1933 {
1934 gas_assert (y.bitfield.class == ClassNone);
1935 gas_assert (y.bitfield.instance == InstanceNone);
1936
1937 switch (ARRAY_SIZE (x.array))
1938 {
1939 case 3:
1940 x.array [2] &= ~y.array [2];
1941 /* Fall through. */
1942 case 2:
1943 x.array [1] &= ~y.array [1];
1944 /* Fall through. */
1945 case 1:
1946 x.array [0] &= ~y.array [0];
1947 break;
1948 default:
1949 abort ();
1950 }
1951 return x;
1952 }
1953
1954 static INLINE i386_operand_type
1955 operand_type_or (i386_operand_type x, i386_operand_type y)
1956 {
1957 gas_assert (x.bitfield.class == ClassNone ||
1958 y.bitfield.class == ClassNone ||
1959 x.bitfield.class == y.bitfield.class);
1960 gas_assert (x.bitfield.instance == InstanceNone ||
1961 y.bitfield.instance == InstanceNone ||
1962 x.bitfield.instance == y.bitfield.instance);
1963
1964 switch (ARRAY_SIZE (x.array))
1965 {
1966 case 3:
1967 x.array [2] |= y.array [2];
1968 /* Fall through. */
1969 case 2:
1970 x.array [1] |= y.array [1];
1971 /* Fall through. */
1972 case 1:
1973 x.array [0] |= y.array [0];
1974 break;
1975 default:
1976 abort ();
1977 }
1978 return x;
1979 }
1980
1981 static INLINE i386_operand_type
1982 operand_type_xor (i386_operand_type x, i386_operand_type y)
1983 {
1984 gas_assert (y.bitfield.class == ClassNone);
1985 gas_assert (y.bitfield.instance == InstanceNone);
1986
1987 switch (ARRAY_SIZE (x.array))
1988 {
1989 case 3:
1990 x.array [2] ^= y.array [2];
1991 /* Fall through. */
1992 case 2:
1993 x.array [1] ^= y.array [1];
1994 /* Fall through. */
1995 case 1:
1996 x.array [0] ^= y.array [0];
1997 break;
1998 default:
1999 abort ();
2000 }
2001 return x;
2002 }
2003
2004 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2005 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2006 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2007 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2008 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2009 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2010 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2011 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2012 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2013 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2014 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2015 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2016 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2017 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2018 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2019 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2020 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2021
2022 enum operand_type
2023 {
2024 reg,
2025 imm,
2026 disp,
2027 anymem
2028 };
2029
2030 static INLINE int
2031 operand_type_check (i386_operand_type t, enum operand_type c)
2032 {
2033 switch (c)
2034 {
2035 case reg:
2036 return t.bitfield.class == Reg;
2037
2038 case imm:
2039 return (t.bitfield.imm8
2040 || t.bitfield.imm8s
2041 || t.bitfield.imm16
2042 || t.bitfield.imm32
2043 || t.bitfield.imm32s
2044 || t.bitfield.imm64);
2045
2046 case disp:
2047 return (t.bitfield.disp8
2048 || t.bitfield.disp16
2049 || t.bitfield.disp32
2050 || t.bitfield.disp32s
2051 || t.bitfield.disp64);
2052
2053 case anymem:
2054 return (t.bitfield.disp8
2055 || t.bitfield.disp16
2056 || t.bitfield.disp32
2057 || t.bitfield.disp32s
2058 || t.bitfield.disp64
2059 || t.bitfield.baseindex);
2060
2061 default:
2062 abort ();
2063 }
2064
2065 return 0;
2066 }
2067
2068 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2069 between operand GIVEN and opeand WANTED for instruction template T. */
2070
2071 static INLINE int
2072 match_operand_size (const insn_template *t, unsigned int wanted,
2073 unsigned int given)
2074 {
2075 return !((i.types[given].bitfield.byte
2076 && !t->operand_types[wanted].bitfield.byte)
2077 || (i.types[given].bitfield.word
2078 && !t->operand_types[wanted].bitfield.word)
2079 || (i.types[given].bitfield.dword
2080 && !t->operand_types[wanted].bitfield.dword)
2081 || (i.types[given].bitfield.qword
2082 && !t->operand_types[wanted].bitfield.qword)
2083 || (i.types[given].bitfield.tbyte
2084 && !t->operand_types[wanted].bitfield.tbyte));
2085 }
2086
2087 /* Return 1 if there is no conflict in SIMD register between operand
2088 GIVEN and opeand WANTED for instruction template T. */
2089
2090 static INLINE int
2091 match_simd_size (const insn_template *t, unsigned int wanted,
2092 unsigned int given)
2093 {
2094 return !((i.types[given].bitfield.xmmword
2095 && !t->operand_types[wanted].bitfield.xmmword)
2096 || (i.types[given].bitfield.ymmword
2097 && !t->operand_types[wanted].bitfield.ymmword)
2098 || (i.types[given].bitfield.zmmword
2099 && !t->operand_types[wanted].bitfield.zmmword));
2100 }
2101
2102 /* Return 1 if there is no conflict in any size between operand GIVEN
2103 and opeand WANTED for instruction template T. */
2104
2105 static INLINE int
2106 match_mem_size (const insn_template *t, unsigned int wanted,
2107 unsigned int given)
2108 {
2109 return (match_operand_size (t, wanted, given)
2110 && !((i.types[given].bitfield.unspecified
2111 && !i.broadcast
2112 && !t->operand_types[wanted].bitfield.unspecified)
2113 || (i.types[given].bitfield.fword
2114 && !t->operand_types[wanted].bitfield.fword)
2115 /* For scalar opcode templates to allow register and memory
2116 operands at the same time, some special casing is needed
2117 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2118 down-conversion vpmov*. */
2119 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2120 && !t->opcode_modifier.broadcast
2121 && (t->operand_types[wanted].bitfield.byte
2122 || t->operand_types[wanted].bitfield.word
2123 || t->operand_types[wanted].bitfield.dword
2124 || t->operand_types[wanted].bitfield.qword))
2125 ? (i.types[given].bitfield.xmmword
2126 || i.types[given].bitfield.ymmword
2127 || i.types[given].bitfield.zmmword)
2128 : !match_simd_size(t, wanted, given))));
2129 }
2130
2131 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2132 operands for instruction template T, and it has MATCH_REVERSE set if there
2133 is no size conflict on any operands for the template with operands reversed
2134 (and the template allows for reversing in the first place). */
2135
2136 #define MATCH_STRAIGHT 1
2137 #define MATCH_REVERSE 2
2138
2139 static INLINE unsigned int
2140 operand_size_match (const insn_template *t)
2141 {
2142 unsigned int j, match = MATCH_STRAIGHT;
2143
2144 /* Don't check non-absolute jump instructions. */
2145 if (t->opcode_modifier.jump
2146 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2147 return match;
2148
2149 /* Check memory and accumulator operand size. */
2150 for (j = 0; j < i.operands; j++)
2151 {
2152 if (i.types[j].bitfield.class != Reg
2153 && i.types[j].bitfield.class != RegSIMD
2154 && t->opcode_modifier.anysize)
2155 continue;
2156
2157 if (t->operand_types[j].bitfield.class == Reg
2158 && !match_operand_size (t, j, j))
2159 {
2160 match = 0;
2161 break;
2162 }
2163
2164 if (t->operand_types[j].bitfield.class == RegSIMD
2165 && !match_simd_size (t, j, j))
2166 {
2167 match = 0;
2168 break;
2169 }
2170
2171 if (t->operand_types[j].bitfield.instance == Accum
2172 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2173 {
2174 match = 0;
2175 break;
2176 }
2177
2178 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2179 {
2180 match = 0;
2181 break;
2182 }
2183 }
2184
2185 if (!t->opcode_modifier.d)
2186 {
2187 mismatch:
2188 if (!match)
2189 i.error = operand_size_mismatch;
2190 return match;
2191 }
2192
2193 /* Check reverse. */
2194 gas_assert (i.operands >= 2 && i.operands <= 3);
2195
2196 for (j = 0; j < i.operands; j++)
2197 {
2198 unsigned int given = i.operands - j - 1;
2199
2200 if (t->operand_types[j].bitfield.class == Reg
2201 && !match_operand_size (t, j, given))
2202 goto mismatch;
2203
2204 if (t->operand_types[j].bitfield.class == RegSIMD
2205 && !match_simd_size (t, j, given))
2206 goto mismatch;
2207
2208 if (t->operand_types[j].bitfield.instance == Accum
2209 && (!match_operand_size (t, j, given)
2210 || !match_simd_size (t, j, given)))
2211 goto mismatch;
2212
2213 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2214 goto mismatch;
2215 }
2216
2217 return match | MATCH_REVERSE;
2218 }
2219
2220 static INLINE int
2221 operand_type_match (i386_operand_type overlap,
2222 i386_operand_type given)
2223 {
2224 i386_operand_type temp = overlap;
2225
2226 temp.bitfield.unspecified = 0;
2227 temp.bitfield.byte = 0;
2228 temp.bitfield.word = 0;
2229 temp.bitfield.dword = 0;
2230 temp.bitfield.fword = 0;
2231 temp.bitfield.qword = 0;
2232 temp.bitfield.tbyte = 0;
2233 temp.bitfield.xmmword = 0;
2234 temp.bitfield.ymmword = 0;
2235 temp.bitfield.zmmword = 0;
2236 if (operand_type_all_zero (&temp))
2237 goto mismatch;
2238
2239 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2240 return 1;
2241
2242 mismatch:
2243 i.error = operand_type_mismatch;
2244 return 0;
2245 }
2246
2247 /* If given types g0 and g1 are registers they must be of the same type
2248 unless the expected operand type register overlap is null.
2249 Some Intel syntax memory operand size checking also happens here. */
2250
2251 static INLINE int
2252 operand_type_register_match (i386_operand_type g0,
2253 i386_operand_type t0,
2254 i386_operand_type g1,
2255 i386_operand_type t1)
2256 {
2257 if (g0.bitfield.class != Reg
2258 && g0.bitfield.class != RegSIMD
2259 && (!operand_type_check (g0, anymem)
2260 || g0.bitfield.unspecified
2261 || (t0.bitfield.class != Reg
2262 && t0.bitfield.class != RegSIMD)))
2263 return 1;
2264
2265 if (g1.bitfield.class != Reg
2266 && g1.bitfield.class != RegSIMD
2267 && (!operand_type_check (g1, anymem)
2268 || g1.bitfield.unspecified
2269 || (t1.bitfield.class != Reg
2270 && t1.bitfield.class != RegSIMD)))
2271 return 1;
2272
2273 if (g0.bitfield.byte == g1.bitfield.byte
2274 && g0.bitfield.word == g1.bitfield.word
2275 && g0.bitfield.dword == g1.bitfield.dword
2276 && g0.bitfield.qword == g1.bitfield.qword
2277 && g0.bitfield.xmmword == g1.bitfield.xmmword
2278 && g0.bitfield.ymmword == g1.bitfield.ymmword
2279 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2280 return 1;
2281
2282 if (!(t0.bitfield.byte & t1.bitfield.byte)
2283 && !(t0.bitfield.word & t1.bitfield.word)
2284 && !(t0.bitfield.dword & t1.bitfield.dword)
2285 && !(t0.bitfield.qword & t1.bitfield.qword)
2286 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2287 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2288 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2289 return 1;
2290
2291 i.error = register_type_mismatch;
2292
2293 return 0;
2294 }
2295
2296 static INLINE unsigned int
2297 register_number (const reg_entry *r)
2298 {
2299 unsigned int nr = r->reg_num;
2300
2301 if (r->reg_flags & RegRex)
2302 nr += 8;
2303
2304 if (r->reg_flags & RegVRex)
2305 nr += 16;
2306
2307 return nr;
2308 }
2309
2310 static INLINE unsigned int
2311 mode_from_disp_size (i386_operand_type t)
2312 {
2313 if (t.bitfield.disp8)
2314 return 1;
2315 else if (t.bitfield.disp16
2316 || t.bitfield.disp32
2317 || t.bitfield.disp32s)
2318 return 2;
2319 else
2320 return 0;
2321 }
2322
2323 static INLINE int
2324 fits_in_signed_byte (addressT num)
2325 {
2326 return num + 0x80 <= 0xff;
2327 }
2328
2329 static INLINE int
2330 fits_in_unsigned_byte (addressT num)
2331 {
2332 return num <= 0xff;
2333 }
2334
2335 static INLINE int
2336 fits_in_unsigned_word (addressT num)
2337 {
2338 return num <= 0xffff;
2339 }
2340
2341 static INLINE int
2342 fits_in_signed_word (addressT num)
2343 {
2344 return num + 0x8000 <= 0xffff;
2345 }
2346
2347 static INLINE int
2348 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2349 {
2350 #ifndef BFD64
2351 return 1;
2352 #else
2353 return num + 0x80000000 <= 0xffffffff;
2354 #endif
2355 } /* fits_in_signed_long() */
2356
2357 static INLINE int
2358 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2359 {
2360 #ifndef BFD64
2361 return 1;
2362 #else
2363 return num <= 0xffffffff;
2364 #endif
2365 } /* fits_in_unsigned_long() */
2366
2367 static INLINE int
2368 fits_in_disp8 (offsetT num)
2369 {
2370 int shift = i.memshift;
2371 unsigned int mask;
2372
2373 if (shift == -1)
2374 abort ();
2375
2376 mask = (1 << shift) - 1;
2377
2378 /* Return 0 if NUM isn't properly aligned. */
2379 if ((num & mask))
2380 return 0;
2381
2382 /* Check if NUM will fit in 8bit after shift. */
2383 return fits_in_signed_byte (num >> shift);
2384 }
2385
2386 static INLINE int
2387 fits_in_imm4 (offsetT num)
2388 {
2389 return (num & 0xf) == num;
2390 }
2391
2392 static i386_operand_type
2393 smallest_imm_type (offsetT num)
2394 {
2395 i386_operand_type t;
2396
2397 operand_type_set (&t, 0);
2398 t.bitfield.imm64 = 1;
2399
2400 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2401 {
2402 /* This code is disabled on the 486 because all the Imm1 forms
2403 in the opcode table are slower on the i486. They're the
2404 versions with the implicitly specified single-position
2405 displacement, which has another syntax if you really want to
2406 use that form. */
2407 t.bitfield.imm1 = 1;
2408 t.bitfield.imm8 = 1;
2409 t.bitfield.imm8s = 1;
2410 t.bitfield.imm16 = 1;
2411 t.bitfield.imm32 = 1;
2412 t.bitfield.imm32s = 1;
2413 }
2414 else if (fits_in_signed_byte (num))
2415 {
2416 t.bitfield.imm8 = 1;
2417 t.bitfield.imm8s = 1;
2418 t.bitfield.imm16 = 1;
2419 t.bitfield.imm32 = 1;
2420 t.bitfield.imm32s = 1;
2421 }
2422 else if (fits_in_unsigned_byte (num))
2423 {
2424 t.bitfield.imm8 = 1;
2425 t.bitfield.imm16 = 1;
2426 t.bitfield.imm32 = 1;
2427 t.bitfield.imm32s = 1;
2428 }
2429 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2430 {
2431 t.bitfield.imm16 = 1;
2432 t.bitfield.imm32 = 1;
2433 t.bitfield.imm32s = 1;
2434 }
2435 else if (fits_in_signed_long (num))
2436 {
2437 t.bitfield.imm32 = 1;
2438 t.bitfield.imm32s = 1;
2439 }
2440 else if (fits_in_unsigned_long (num))
2441 t.bitfield.imm32 = 1;
2442
2443 return t;
2444 }
2445
2446 static offsetT
2447 offset_in_range (offsetT val, int size)
2448 {
2449 addressT mask;
2450
2451 switch (size)
2452 {
2453 case 1: mask = ((addressT) 1 << 8) - 1; break;
2454 case 2: mask = ((addressT) 1 << 16) - 1; break;
2455 case 4: mask = ((addressT) 2 << 31) - 1; break;
2456 #ifdef BFD64
2457 case 8: mask = ((addressT) 2 << 63) - 1; break;
2458 #endif
2459 default: abort ();
2460 }
2461
2462 #ifdef BFD64
2463 /* If BFD64, sign extend val for 32bit address mode. */
2464 if (flag_code != CODE_64BIT
2465 || i.prefix[ADDR_PREFIX])
2466 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2467 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2468 #endif
2469
2470 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2471 {
2472 char buf1[40], buf2[40];
2473
2474 sprint_value (buf1, val);
2475 sprint_value (buf2, val & mask);
2476 as_warn (_("%s shortened to %s"), buf1, buf2);
2477 }
2478 return val & mask;
2479 }
2480
2481 enum PREFIX_GROUP
2482 {
2483 PREFIX_EXIST = 0,
2484 PREFIX_LOCK,
2485 PREFIX_REP,
2486 PREFIX_DS,
2487 PREFIX_OTHER
2488 };
2489
2490 /* Returns
2491 a. PREFIX_EXIST if attempting to add a prefix where one from the
2492 same class already exists.
2493 b. PREFIX_LOCK if lock prefix is added.
2494 c. PREFIX_REP if rep/repne prefix is added.
2495 d. PREFIX_DS if ds prefix is added.
2496 e. PREFIX_OTHER if other prefix is added.
2497 */
2498
2499 static enum PREFIX_GROUP
2500 add_prefix (unsigned int prefix)
2501 {
2502 enum PREFIX_GROUP ret = PREFIX_OTHER;
2503 unsigned int q;
2504
2505 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2506 && flag_code == CODE_64BIT)
2507 {
2508 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2509 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2510 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2511 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2512 ret = PREFIX_EXIST;
2513 q = REX_PREFIX;
2514 }
2515 else
2516 {
2517 switch (prefix)
2518 {
2519 default:
2520 abort ();
2521
2522 case DS_PREFIX_OPCODE:
2523 ret = PREFIX_DS;
2524 /* Fall through. */
2525 case CS_PREFIX_OPCODE:
2526 case ES_PREFIX_OPCODE:
2527 case FS_PREFIX_OPCODE:
2528 case GS_PREFIX_OPCODE:
2529 case SS_PREFIX_OPCODE:
2530 q = SEG_PREFIX;
2531 break;
2532
2533 case REPNE_PREFIX_OPCODE:
2534 case REPE_PREFIX_OPCODE:
2535 q = REP_PREFIX;
2536 ret = PREFIX_REP;
2537 break;
2538
2539 case LOCK_PREFIX_OPCODE:
2540 q = LOCK_PREFIX;
2541 ret = PREFIX_LOCK;
2542 break;
2543
2544 case FWAIT_OPCODE:
2545 q = WAIT_PREFIX;
2546 break;
2547
2548 case ADDR_PREFIX_OPCODE:
2549 q = ADDR_PREFIX;
2550 break;
2551
2552 case DATA_PREFIX_OPCODE:
2553 q = DATA_PREFIX;
2554 break;
2555 }
2556 if (i.prefix[q] != 0)
2557 ret = PREFIX_EXIST;
2558 }
2559
2560 if (ret)
2561 {
2562 if (!i.prefix[q])
2563 ++i.prefixes;
2564 i.prefix[q] |= prefix;
2565 }
2566 else
2567 as_bad (_("same type of prefix used twice"));
2568
2569 return ret;
2570 }
2571
2572 static void
2573 update_code_flag (int value, int check)
2574 {
2575 PRINTF_LIKE ((*as_error));
2576
2577 flag_code = (enum flag_code) value;
2578 if (flag_code == CODE_64BIT)
2579 {
2580 cpu_arch_flags.bitfield.cpu64 = 1;
2581 cpu_arch_flags.bitfield.cpuno64 = 0;
2582 }
2583 else
2584 {
2585 cpu_arch_flags.bitfield.cpu64 = 0;
2586 cpu_arch_flags.bitfield.cpuno64 = 1;
2587 }
2588 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2589 {
2590 if (check)
2591 as_error = as_fatal;
2592 else
2593 as_error = as_bad;
2594 (*as_error) (_("64bit mode not supported on `%s'."),
2595 cpu_arch_name ? cpu_arch_name : default_arch);
2596 }
2597 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2598 {
2599 if (check)
2600 as_error = as_fatal;
2601 else
2602 as_error = as_bad;
2603 (*as_error) (_("32bit mode not supported on `%s'."),
2604 cpu_arch_name ? cpu_arch_name : default_arch);
2605 }
2606 stackop_size = '\0';
2607 }
2608
2609 static void
2610 set_code_flag (int value)
2611 {
2612 update_code_flag (value, 0);
2613 }
2614
2615 static void
2616 set_16bit_gcc_code_flag (int new_code_flag)
2617 {
2618 flag_code = (enum flag_code) new_code_flag;
2619 if (flag_code != CODE_16BIT)
2620 abort ();
2621 cpu_arch_flags.bitfield.cpu64 = 0;
2622 cpu_arch_flags.bitfield.cpuno64 = 1;
2623 stackop_size = LONG_MNEM_SUFFIX;
2624 }
2625
2626 static void
2627 set_intel_syntax (int syntax_flag)
2628 {
2629 /* Find out if register prefixing is specified. */
2630 int ask_naked_reg = 0;
2631
2632 SKIP_WHITESPACE ();
2633 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2634 {
2635 char *string;
2636 int e = get_symbol_name (&string);
2637
2638 if (strcmp (string, "prefix") == 0)
2639 ask_naked_reg = 1;
2640 else if (strcmp (string, "noprefix") == 0)
2641 ask_naked_reg = -1;
2642 else
2643 as_bad (_("bad argument to syntax directive."));
2644 (void) restore_line_pointer (e);
2645 }
2646 demand_empty_rest_of_line ();
2647
2648 intel_syntax = syntax_flag;
2649
2650 if (ask_naked_reg == 0)
2651 allow_naked_reg = (intel_syntax
2652 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2653 else
2654 allow_naked_reg = (ask_naked_reg < 0);
2655
2656 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2657
2658 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2659 identifier_chars['$'] = intel_syntax ? '$' : 0;
2660 register_prefix = allow_naked_reg ? "" : "%";
2661 }
2662
2663 static void
2664 set_intel_mnemonic (int mnemonic_flag)
2665 {
2666 intel_mnemonic = mnemonic_flag;
2667 }
2668
2669 static void
2670 set_allow_index_reg (int flag)
2671 {
2672 allow_index_reg = flag;
2673 }
2674
2675 static void
2676 set_check (int what)
2677 {
2678 enum check_kind *kind;
2679 const char *str;
2680
2681 if (what)
2682 {
2683 kind = &operand_check;
2684 str = "operand";
2685 }
2686 else
2687 {
2688 kind = &sse_check;
2689 str = "sse";
2690 }
2691
2692 SKIP_WHITESPACE ();
2693
2694 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2695 {
2696 char *string;
2697 int e = get_symbol_name (&string);
2698
2699 if (strcmp (string, "none") == 0)
2700 *kind = check_none;
2701 else if (strcmp (string, "warning") == 0)
2702 *kind = check_warning;
2703 else if (strcmp (string, "error") == 0)
2704 *kind = check_error;
2705 else
2706 as_bad (_("bad argument to %s_check directive."), str);
2707 (void) restore_line_pointer (e);
2708 }
2709 else
2710 as_bad (_("missing argument for %s_check directive"), str);
2711
2712 demand_empty_rest_of_line ();
2713 }
2714
2715 static void
2716 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2717 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2718 {
2719 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2720 static const char *arch;
2721
2722 /* Intel LIOM is only supported on ELF. */
2723 if (!IS_ELF)
2724 return;
2725
2726 if (!arch)
2727 {
2728 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2729 use default_arch. */
2730 arch = cpu_arch_name;
2731 if (!arch)
2732 arch = default_arch;
2733 }
2734
2735 /* If we are targeting Intel MCU, we must enable it. */
2736 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2737 || new_flag.bitfield.cpuiamcu)
2738 return;
2739
2740 /* If we are targeting Intel L1OM, we must enable it. */
2741 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2742 || new_flag.bitfield.cpul1om)
2743 return;
2744
2745 /* If we are targeting Intel K1OM, we must enable it. */
2746 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2747 || new_flag.bitfield.cpuk1om)
2748 return;
2749
2750 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2751 #endif
2752 }
2753
2754 static void
2755 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2756 {
2757 SKIP_WHITESPACE ();
2758
2759 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2760 {
2761 char *string;
2762 int e = get_symbol_name (&string);
2763 unsigned int j;
2764 i386_cpu_flags flags;
2765
2766 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2767 {
2768 if (strcmp (string, cpu_arch[j].name) == 0)
2769 {
2770 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2771
2772 if (*string != '.')
2773 {
2774 cpu_arch_name = cpu_arch[j].name;
2775 cpu_sub_arch_name = NULL;
2776 cpu_arch_flags = cpu_arch[j].flags;
2777 if (flag_code == CODE_64BIT)
2778 {
2779 cpu_arch_flags.bitfield.cpu64 = 1;
2780 cpu_arch_flags.bitfield.cpuno64 = 0;
2781 }
2782 else
2783 {
2784 cpu_arch_flags.bitfield.cpu64 = 0;
2785 cpu_arch_flags.bitfield.cpuno64 = 1;
2786 }
2787 cpu_arch_isa = cpu_arch[j].type;
2788 cpu_arch_isa_flags = cpu_arch[j].flags;
2789 if (!cpu_arch_tune_set)
2790 {
2791 cpu_arch_tune = cpu_arch_isa;
2792 cpu_arch_tune_flags = cpu_arch_isa_flags;
2793 }
2794 break;
2795 }
2796
2797 flags = cpu_flags_or (cpu_arch_flags,
2798 cpu_arch[j].flags);
2799
2800 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2801 {
2802 if (cpu_sub_arch_name)
2803 {
2804 char *name = cpu_sub_arch_name;
2805 cpu_sub_arch_name = concat (name,
2806 cpu_arch[j].name,
2807 (const char *) NULL);
2808 free (name);
2809 }
2810 else
2811 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2812 cpu_arch_flags = flags;
2813 cpu_arch_isa_flags = flags;
2814 }
2815 else
2816 cpu_arch_isa_flags
2817 = cpu_flags_or (cpu_arch_isa_flags,
2818 cpu_arch[j].flags);
2819 (void) restore_line_pointer (e);
2820 demand_empty_rest_of_line ();
2821 return;
2822 }
2823 }
2824
2825 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2826 {
2827 /* Disable an ISA extension. */
2828 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2829 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2830 {
2831 flags = cpu_flags_and_not (cpu_arch_flags,
2832 cpu_noarch[j].flags);
2833 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2834 {
2835 if (cpu_sub_arch_name)
2836 {
2837 char *name = cpu_sub_arch_name;
2838 cpu_sub_arch_name = concat (name, string,
2839 (const char *) NULL);
2840 free (name);
2841 }
2842 else
2843 cpu_sub_arch_name = xstrdup (string);
2844 cpu_arch_flags = flags;
2845 cpu_arch_isa_flags = flags;
2846 }
2847 (void) restore_line_pointer (e);
2848 demand_empty_rest_of_line ();
2849 return;
2850 }
2851
2852 j = ARRAY_SIZE (cpu_arch);
2853 }
2854
2855 if (j >= ARRAY_SIZE (cpu_arch))
2856 as_bad (_("no such architecture: `%s'"), string);
2857
2858 *input_line_pointer = e;
2859 }
2860 else
2861 as_bad (_("missing cpu architecture"));
2862
2863 no_cond_jump_promotion = 0;
2864 if (*input_line_pointer == ','
2865 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2866 {
2867 char *string;
2868 char e;
2869
2870 ++input_line_pointer;
2871 e = get_symbol_name (&string);
2872
2873 if (strcmp (string, "nojumps") == 0)
2874 no_cond_jump_promotion = 1;
2875 else if (strcmp (string, "jumps") == 0)
2876 ;
2877 else
2878 as_bad (_("no such architecture modifier: `%s'"), string);
2879
2880 (void) restore_line_pointer (e);
2881 }
2882
2883 demand_empty_rest_of_line ();
2884 }
2885
2886 enum bfd_architecture
2887 i386_arch (void)
2888 {
2889 if (cpu_arch_isa == PROCESSOR_L1OM)
2890 {
2891 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2892 || flag_code != CODE_64BIT)
2893 as_fatal (_("Intel L1OM is 64bit ELF only"));
2894 return bfd_arch_l1om;
2895 }
2896 else if (cpu_arch_isa == PROCESSOR_K1OM)
2897 {
2898 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2899 || flag_code != CODE_64BIT)
2900 as_fatal (_("Intel K1OM is 64bit ELF only"));
2901 return bfd_arch_k1om;
2902 }
2903 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2904 {
2905 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2906 || flag_code == CODE_64BIT)
2907 as_fatal (_("Intel MCU is 32bit ELF only"));
2908 return bfd_arch_iamcu;
2909 }
2910 else
2911 return bfd_arch_i386;
2912 }
2913
2914 unsigned long
2915 i386_mach (void)
2916 {
2917 if (!strncmp (default_arch, "x86_64", 6))
2918 {
2919 if (cpu_arch_isa == PROCESSOR_L1OM)
2920 {
2921 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2922 || default_arch[6] != '\0')
2923 as_fatal (_("Intel L1OM is 64bit ELF only"));
2924 return bfd_mach_l1om;
2925 }
2926 else if (cpu_arch_isa == PROCESSOR_K1OM)
2927 {
2928 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2929 || default_arch[6] != '\0')
2930 as_fatal (_("Intel K1OM is 64bit ELF only"));
2931 return bfd_mach_k1om;
2932 }
2933 else if (default_arch[6] == '\0')
2934 return bfd_mach_x86_64;
2935 else
2936 return bfd_mach_x64_32;
2937 }
2938 else if (!strcmp (default_arch, "i386")
2939 || !strcmp (default_arch, "iamcu"))
2940 {
2941 if (cpu_arch_isa == PROCESSOR_IAMCU)
2942 {
2943 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2944 as_fatal (_("Intel MCU is 32bit ELF only"));
2945 return bfd_mach_i386_iamcu;
2946 }
2947 else
2948 return bfd_mach_i386_i386;
2949 }
2950 else
2951 as_fatal (_("unknown architecture"));
2952 }
2953 \f
2954 void
2955 md_begin (void)
2956 {
2957 const char *hash_err;
2958
2959 /* Support pseudo prefixes like {disp32}. */
2960 lex_type ['{'] = LEX_BEGIN_NAME;
2961
2962 /* Initialize op_hash hash table. */
2963 op_hash = hash_new ();
2964
2965 {
2966 const insn_template *optab;
2967 templates *core_optab;
2968
2969 /* Setup for loop. */
2970 optab = i386_optab;
2971 core_optab = XNEW (templates);
2972 core_optab->start = optab;
2973
2974 while (1)
2975 {
2976 ++optab;
2977 if (optab->name == NULL
2978 || strcmp (optab->name, (optab - 1)->name) != 0)
2979 {
2980 /* different name --> ship out current template list;
2981 add to hash table; & begin anew. */
2982 core_optab->end = optab;
2983 hash_err = hash_insert (op_hash,
2984 (optab - 1)->name,
2985 (void *) core_optab);
2986 if (hash_err)
2987 {
2988 as_fatal (_("can't hash %s: %s"),
2989 (optab - 1)->name,
2990 hash_err);
2991 }
2992 if (optab->name == NULL)
2993 break;
2994 core_optab = XNEW (templates);
2995 core_optab->start = optab;
2996 }
2997 }
2998 }
2999
3000 /* Initialize reg_hash hash table. */
3001 reg_hash = hash_new ();
3002 {
3003 const reg_entry *regtab;
3004 unsigned int regtab_size = i386_regtab_size;
3005
3006 for (regtab = i386_regtab; regtab_size--; regtab++)
3007 {
3008 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
3009 if (hash_err)
3010 as_fatal (_("can't hash %s: %s"),
3011 regtab->reg_name,
3012 hash_err);
3013 }
3014 }
3015
3016 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3017 {
3018 int c;
3019 char *p;
3020
3021 for (c = 0; c < 256; c++)
3022 {
3023 if (ISDIGIT (c))
3024 {
3025 digit_chars[c] = c;
3026 mnemonic_chars[c] = c;
3027 register_chars[c] = c;
3028 operand_chars[c] = c;
3029 }
3030 else if (ISLOWER (c))
3031 {
3032 mnemonic_chars[c] = c;
3033 register_chars[c] = c;
3034 operand_chars[c] = c;
3035 }
3036 else if (ISUPPER (c))
3037 {
3038 mnemonic_chars[c] = TOLOWER (c);
3039 register_chars[c] = mnemonic_chars[c];
3040 operand_chars[c] = c;
3041 }
3042 else if (c == '{' || c == '}')
3043 {
3044 mnemonic_chars[c] = c;
3045 operand_chars[c] = c;
3046 }
3047
3048 if (ISALPHA (c) || ISDIGIT (c))
3049 identifier_chars[c] = c;
3050 else if (c >= 128)
3051 {
3052 identifier_chars[c] = c;
3053 operand_chars[c] = c;
3054 }
3055 }
3056
3057 #ifdef LEX_AT
3058 identifier_chars['@'] = '@';
3059 #endif
3060 #ifdef LEX_QM
3061 identifier_chars['?'] = '?';
3062 operand_chars['?'] = '?';
3063 #endif
3064 digit_chars['-'] = '-';
3065 mnemonic_chars['_'] = '_';
3066 mnemonic_chars['-'] = '-';
3067 mnemonic_chars['.'] = '.';
3068 identifier_chars['_'] = '_';
3069 identifier_chars['.'] = '.';
3070
3071 for (p = operand_special_chars; *p != '\0'; p++)
3072 operand_chars[(unsigned char) *p] = *p;
3073 }
3074
3075 if (flag_code == CODE_64BIT)
3076 {
3077 #if defined (OBJ_COFF) && defined (TE_PE)
3078 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3079 ? 32 : 16);
3080 #else
3081 x86_dwarf2_return_column = 16;
3082 #endif
3083 x86_cie_data_alignment = -8;
3084 }
3085 else
3086 {
3087 x86_dwarf2_return_column = 8;
3088 x86_cie_data_alignment = -4;
3089 }
3090
3091 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3092 can be turned into BRANCH_PREFIX frag. */
3093 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3094 abort ();
3095 }
3096
3097 void
3098 i386_print_statistics (FILE *file)
3099 {
3100 hash_print_statistics (file, "i386 opcode", op_hash);
3101 hash_print_statistics (file, "i386 register", reg_hash);
3102 }
3103 \f
3104 #ifdef DEBUG386
3105
3106 /* Debugging routines for md_assemble. */
3107 static void pte (insn_template *);
3108 static void pt (i386_operand_type);
3109 static void pe (expressionS *);
3110 static void ps (symbolS *);
3111
3112 static void
3113 pi (const char *line, i386_insn *x)
3114 {
3115 unsigned int j;
3116
3117 fprintf (stdout, "%s: template ", line);
3118 pte (&x->tm);
3119 fprintf (stdout, " address: base %s index %s scale %x\n",
3120 x->base_reg ? x->base_reg->reg_name : "none",
3121 x->index_reg ? x->index_reg->reg_name : "none",
3122 x->log2_scale_factor);
3123 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3124 x->rm.mode, x->rm.reg, x->rm.regmem);
3125 fprintf (stdout, " sib: base %x index %x scale %x\n",
3126 x->sib.base, x->sib.index, x->sib.scale);
3127 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3128 (x->rex & REX_W) != 0,
3129 (x->rex & REX_R) != 0,
3130 (x->rex & REX_X) != 0,
3131 (x->rex & REX_B) != 0);
3132 for (j = 0; j < x->operands; j++)
3133 {
3134 fprintf (stdout, " #%d: ", j + 1);
3135 pt (x->types[j]);
3136 fprintf (stdout, "\n");
3137 if (x->types[j].bitfield.class == Reg
3138 || x->types[j].bitfield.class == RegMMX
3139 || x->types[j].bitfield.class == RegSIMD
3140 || x->types[j].bitfield.class == SReg
3141 || x->types[j].bitfield.class == RegCR
3142 || x->types[j].bitfield.class == RegDR
3143 || x->types[j].bitfield.class == RegTR)
3144 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3145 if (operand_type_check (x->types[j], imm))
3146 pe (x->op[j].imms);
3147 if (operand_type_check (x->types[j], disp))
3148 pe (x->op[j].disps);
3149 }
3150 }
3151
3152 static void
3153 pte (insn_template *t)
3154 {
3155 unsigned int j;
3156 fprintf (stdout, " %d operands ", t->operands);
3157 fprintf (stdout, "opcode %x ", t->base_opcode);
3158 if (t->extension_opcode != None)
3159 fprintf (stdout, "ext %x ", t->extension_opcode);
3160 if (t->opcode_modifier.d)
3161 fprintf (stdout, "D");
3162 if (t->opcode_modifier.w)
3163 fprintf (stdout, "W");
3164 fprintf (stdout, "\n");
3165 for (j = 0; j < t->operands; j++)
3166 {
3167 fprintf (stdout, " #%d type ", j + 1);
3168 pt (t->operand_types[j]);
3169 fprintf (stdout, "\n");
3170 }
3171 }
3172
3173 static void
3174 pe (expressionS *e)
3175 {
3176 fprintf (stdout, " operation %d\n", e->X_op);
3177 fprintf (stdout, " add_number %ld (%lx)\n",
3178 (long) e->X_add_number, (long) e->X_add_number);
3179 if (e->X_add_symbol)
3180 {
3181 fprintf (stdout, " add_symbol ");
3182 ps (e->X_add_symbol);
3183 fprintf (stdout, "\n");
3184 }
3185 if (e->X_op_symbol)
3186 {
3187 fprintf (stdout, " op_symbol ");
3188 ps (e->X_op_symbol);
3189 fprintf (stdout, "\n");
3190 }
3191 }
3192
3193 static void
3194 ps (symbolS *s)
3195 {
3196 fprintf (stdout, "%s type %s%s",
3197 S_GET_NAME (s),
3198 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3199 segment_name (S_GET_SEGMENT (s)));
3200 }
3201
3202 static struct type_name
3203 {
3204 i386_operand_type mask;
3205 const char *name;
3206 }
3207 const type_names[] =
3208 {
3209 { OPERAND_TYPE_REG8, "r8" },
3210 { OPERAND_TYPE_REG16, "r16" },
3211 { OPERAND_TYPE_REG32, "r32" },
3212 { OPERAND_TYPE_REG64, "r64" },
3213 { OPERAND_TYPE_ACC8, "acc8" },
3214 { OPERAND_TYPE_ACC16, "acc16" },
3215 { OPERAND_TYPE_ACC32, "acc32" },
3216 { OPERAND_TYPE_ACC64, "acc64" },
3217 { OPERAND_TYPE_IMM8, "i8" },
3218 { OPERAND_TYPE_IMM8, "i8s" },
3219 { OPERAND_TYPE_IMM16, "i16" },
3220 { OPERAND_TYPE_IMM32, "i32" },
3221 { OPERAND_TYPE_IMM32S, "i32s" },
3222 { OPERAND_TYPE_IMM64, "i64" },
3223 { OPERAND_TYPE_IMM1, "i1" },
3224 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3225 { OPERAND_TYPE_DISP8, "d8" },
3226 { OPERAND_TYPE_DISP16, "d16" },
3227 { OPERAND_TYPE_DISP32, "d32" },
3228 { OPERAND_TYPE_DISP32S, "d32s" },
3229 { OPERAND_TYPE_DISP64, "d64" },
3230 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3231 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3232 { OPERAND_TYPE_CONTROL, "control reg" },
3233 { OPERAND_TYPE_TEST, "test reg" },
3234 { OPERAND_TYPE_DEBUG, "debug reg" },
3235 { OPERAND_TYPE_FLOATREG, "FReg" },
3236 { OPERAND_TYPE_FLOATACC, "FAcc" },
3237 { OPERAND_TYPE_SREG, "SReg" },
3238 { OPERAND_TYPE_REGMMX, "rMMX" },
3239 { OPERAND_TYPE_REGXMM, "rXMM" },
3240 { OPERAND_TYPE_REGYMM, "rYMM" },
3241 { OPERAND_TYPE_REGZMM, "rZMM" },
3242 { OPERAND_TYPE_REGMASK, "Mask reg" },
3243 };
3244
3245 static void
3246 pt (i386_operand_type t)
3247 {
3248 unsigned int j;
3249 i386_operand_type a;
3250
3251 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3252 {
3253 a = operand_type_and (t, type_names[j].mask);
3254 if (operand_type_equal (&a, &type_names[j].mask))
3255 fprintf (stdout, "%s, ", type_names[j].name);
3256 }
3257 fflush (stdout);
3258 }
3259
3260 #endif /* DEBUG386 */
3261 \f
3262 static bfd_reloc_code_real_type
3263 reloc (unsigned int size,
3264 int pcrel,
3265 int sign,
3266 bfd_reloc_code_real_type other)
3267 {
3268 if (other != NO_RELOC)
3269 {
3270 reloc_howto_type *rel;
3271
3272 if (size == 8)
3273 switch (other)
3274 {
3275 case BFD_RELOC_X86_64_GOT32:
3276 return BFD_RELOC_X86_64_GOT64;
3277 break;
3278 case BFD_RELOC_X86_64_GOTPLT64:
3279 return BFD_RELOC_X86_64_GOTPLT64;
3280 break;
3281 case BFD_RELOC_X86_64_PLTOFF64:
3282 return BFD_RELOC_X86_64_PLTOFF64;
3283 break;
3284 case BFD_RELOC_X86_64_GOTPC32:
3285 other = BFD_RELOC_X86_64_GOTPC64;
3286 break;
3287 case BFD_RELOC_X86_64_GOTPCREL:
3288 other = BFD_RELOC_X86_64_GOTPCREL64;
3289 break;
3290 case BFD_RELOC_X86_64_TPOFF32:
3291 other = BFD_RELOC_X86_64_TPOFF64;
3292 break;
3293 case BFD_RELOC_X86_64_DTPOFF32:
3294 other = BFD_RELOC_X86_64_DTPOFF64;
3295 break;
3296 default:
3297 break;
3298 }
3299
3300 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3301 if (other == BFD_RELOC_SIZE32)
3302 {
3303 if (size == 8)
3304 other = BFD_RELOC_SIZE64;
3305 if (pcrel)
3306 {
3307 as_bad (_("there are no pc-relative size relocations"));
3308 return NO_RELOC;
3309 }
3310 }
3311 #endif
3312
3313 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3314 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3315 sign = -1;
3316
3317 rel = bfd_reloc_type_lookup (stdoutput, other);
3318 if (!rel)
3319 as_bad (_("unknown relocation (%u)"), other);
3320 else if (size != bfd_get_reloc_size (rel))
3321 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3322 bfd_get_reloc_size (rel),
3323 size);
3324 else if (pcrel && !rel->pc_relative)
3325 as_bad (_("non-pc-relative relocation for pc-relative field"));
3326 else if ((rel->complain_on_overflow == complain_overflow_signed
3327 && !sign)
3328 || (rel->complain_on_overflow == complain_overflow_unsigned
3329 && sign > 0))
3330 as_bad (_("relocated field and relocation type differ in signedness"));
3331 else
3332 return other;
3333 return NO_RELOC;
3334 }
3335
3336 if (pcrel)
3337 {
3338 if (!sign)
3339 as_bad (_("there are no unsigned pc-relative relocations"));
3340 switch (size)
3341 {
3342 case 1: return BFD_RELOC_8_PCREL;
3343 case 2: return BFD_RELOC_16_PCREL;
3344 case 4: return BFD_RELOC_32_PCREL;
3345 case 8: return BFD_RELOC_64_PCREL;
3346 }
3347 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3348 }
3349 else
3350 {
3351 if (sign > 0)
3352 switch (size)
3353 {
3354 case 4: return BFD_RELOC_X86_64_32S;
3355 }
3356 else
3357 switch (size)
3358 {
3359 case 1: return BFD_RELOC_8;
3360 case 2: return BFD_RELOC_16;
3361 case 4: return BFD_RELOC_32;
3362 case 8: return BFD_RELOC_64;
3363 }
3364 as_bad (_("cannot do %s %u byte relocation"),
3365 sign > 0 ? "signed" : "unsigned", size);
3366 }
3367
3368 return NO_RELOC;
3369 }
3370
3371 /* Here we decide which fixups can be adjusted to make them relative to
3372 the beginning of the section instead of the symbol. Basically we need
3373 to make sure that the dynamic relocations are done correctly, so in
3374 some cases we force the original symbol to be used. */
3375
3376 int
3377 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3378 {
3379 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3380 if (!IS_ELF)
3381 return 1;
3382
3383 /* Don't adjust pc-relative references to merge sections in 64-bit
3384 mode. */
3385 if (use_rela_relocations
3386 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3387 && fixP->fx_pcrel)
3388 return 0;
3389
3390 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3391 and changed later by validate_fix. */
3392 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3393 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3394 return 0;
3395
3396 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3397 for size relocations. */
3398 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3399 || fixP->fx_r_type == BFD_RELOC_SIZE64
3400 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3401 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3402 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3403 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3404 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3405 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3406 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3407 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3408 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3409 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3410 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3411 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3412 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3413 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3414 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3415 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3416 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3417 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3418 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3419 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3420 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3421 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3422 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3423 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3424 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3425 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3426 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3427 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3428 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3429 return 0;
3430 #endif
3431 return 1;
3432 }
3433
3434 static int
3435 intel_float_operand (const char *mnemonic)
3436 {
3437 /* Note that the value returned is meaningful only for opcodes with (memory)
3438 operands, hence the code here is free to improperly handle opcodes that
3439 have no operands (for better performance and smaller code). */
3440
3441 if (mnemonic[0] != 'f')
3442 return 0; /* non-math */
3443
3444 switch (mnemonic[1])
3445 {
3446 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3447 the fs segment override prefix not currently handled because no
3448 call path can make opcodes without operands get here */
3449 case 'i':
3450 return 2 /* integer op */;
3451 case 'l':
3452 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3453 return 3; /* fldcw/fldenv */
3454 break;
3455 case 'n':
3456 if (mnemonic[2] != 'o' /* fnop */)
3457 return 3; /* non-waiting control op */
3458 break;
3459 case 'r':
3460 if (mnemonic[2] == 's')
3461 return 3; /* frstor/frstpm */
3462 break;
3463 case 's':
3464 if (mnemonic[2] == 'a')
3465 return 3; /* fsave */
3466 if (mnemonic[2] == 't')
3467 {
3468 switch (mnemonic[3])
3469 {
3470 case 'c': /* fstcw */
3471 case 'd': /* fstdw */
3472 case 'e': /* fstenv */
3473 case 's': /* fsts[gw] */
3474 return 3;
3475 }
3476 }
3477 break;
3478 case 'x':
3479 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3480 return 0; /* fxsave/fxrstor are not really math ops */
3481 break;
3482 }
3483
3484 return 1;
3485 }
3486
3487 /* Build the VEX prefix. */
3488
3489 static void
3490 build_vex_prefix (const insn_template *t)
3491 {
3492 unsigned int register_specifier;
3493 unsigned int implied_prefix;
3494 unsigned int vector_length;
3495 unsigned int w;
3496
3497 /* Check register specifier. */
3498 if (i.vex.register_specifier)
3499 {
3500 register_specifier =
3501 ~register_number (i.vex.register_specifier) & 0xf;
3502 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3503 }
3504 else
3505 register_specifier = 0xf;
3506
3507 /* Use 2-byte VEX prefix by swapping destination and source operand
3508 if there are more than 1 register operand. */
3509 if (i.reg_operands > 1
3510 && i.vec_encoding != vex_encoding_vex3
3511 && i.dir_encoding == dir_encoding_default
3512 && i.operands == i.reg_operands
3513 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3514 && i.tm.opcode_modifier.vexopcode == VEX0F
3515 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3516 && i.rex == REX_B)
3517 {
3518 unsigned int xchg = i.operands - 1;
3519 union i386_op temp_op;
3520 i386_operand_type temp_type;
3521
3522 temp_type = i.types[xchg];
3523 i.types[xchg] = i.types[0];
3524 i.types[0] = temp_type;
3525 temp_op = i.op[xchg];
3526 i.op[xchg] = i.op[0];
3527 i.op[0] = temp_op;
3528
3529 gas_assert (i.rm.mode == 3);
3530
3531 i.rex = REX_R;
3532 xchg = i.rm.regmem;
3533 i.rm.regmem = i.rm.reg;
3534 i.rm.reg = xchg;
3535
3536 if (i.tm.opcode_modifier.d)
3537 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3538 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3539 else /* Use the next insn. */
3540 i.tm = t[1];
3541 }
3542
3543 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3544 are no memory operands and at least 3 register ones. */
3545 if (i.reg_operands >= 3
3546 && i.vec_encoding != vex_encoding_vex3
3547 && i.reg_operands == i.operands - i.imm_operands
3548 && i.tm.opcode_modifier.vex
3549 && i.tm.opcode_modifier.commutative
3550 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3551 && i.rex == REX_B
3552 && i.vex.register_specifier
3553 && !(i.vex.register_specifier->reg_flags & RegRex))
3554 {
3555 unsigned int xchg = i.operands - i.reg_operands;
3556 union i386_op temp_op;
3557 i386_operand_type temp_type;
3558
3559 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3560 gas_assert (!i.tm.opcode_modifier.sae);
3561 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3562 &i.types[i.operands - 3]));
3563 gas_assert (i.rm.mode == 3);
3564
3565 temp_type = i.types[xchg];
3566 i.types[xchg] = i.types[xchg + 1];
3567 i.types[xchg + 1] = temp_type;
3568 temp_op = i.op[xchg];
3569 i.op[xchg] = i.op[xchg + 1];
3570 i.op[xchg + 1] = temp_op;
3571
3572 i.rex = 0;
3573 xchg = i.rm.regmem | 8;
3574 i.rm.regmem = ~register_specifier & 0xf;
3575 gas_assert (!(i.rm.regmem & 8));
3576 i.vex.register_specifier += xchg - i.rm.regmem;
3577 register_specifier = ~xchg & 0xf;
3578 }
3579
3580 if (i.tm.opcode_modifier.vex == VEXScalar)
3581 vector_length = avxscalar;
3582 else if (i.tm.opcode_modifier.vex == VEX256)
3583 vector_length = 1;
3584 else
3585 {
3586 unsigned int op;
3587
3588 /* Determine vector length from the last multi-length vector
3589 operand. */
3590 vector_length = 0;
3591 for (op = t->operands; op--;)
3592 if (t->operand_types[op].bitfield.xmmword
3593 && t->operand_types[op].bitfield.ymmword
3594 && i.types[op].bitfield.ymmword)
3595 {
3596 vector_length = 1;
3597 break;
3598 }
3599 }
3600
3601 switch ((i.tm.base_opcode >> 8) & 0xff)
3602 {
3603 case 0:
3604 implied_prefix = 0;
3605 break;
3606 case DATA_PREFIX_OPCODE:
3607 implied_prefix = 1;
3608 break;
3609 case REPE_PREFIX_OPCODE:
3610 implied_prefix = 2;
3611 break;
3612 case REPNE_PREFIX_OPCODE:
3613 implied_prefix = 3;
3614 break;
3615 default:
3616 abort ();
3617 }
3618
3619 /* Check the REX.W bit and VEXW. */
3620 if (i.tm.opcode_modifier.vexw == VEXWIG)
3621 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3622 else if (i.tm.opcode_modifier.vexw)
3623 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3624 else
3625 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3626
3627 /* Use 2-byte VEX prefix if possible. */
3628 if (w == 0
3629 && i.vec_encoding != vex_encoding_vex3
3630 && i.tm.opcode_modifier.vexopcode == VEX0F
3631 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3632 {
3633 /* 2-byte VEX prefix. */
3634 unsigned int r;
3635
3636 i.vex.length = 2;
3637 i.vex.bytes[0] = 0xc5;
3638
3639 /* Check the REX.R bit. */
3640 r = (i.rex & REX_R) ? 0 : 1;
3641 i.vex.bytes[1] = (r << 7
3642 | register_specifier << 3
3643 | vector_length << 2
3644 | implied_prefix);
3645 }
3646 else
3647 {
3648 /* 3-byte VEX prefix. */
3649 unsigned int m;
3650
3651 i.vex.length = 3;
3652
3653 switch (i.tm.opcode_modifier.vexopcode)
3654 {
3655 case VEX0F:
3656 m = 0x1;
3657 i.vex.bytes[0] = 0xc4;
3658 break;
3659 case VEX0F38:
3660 m = 0x2;
3661 i.vex.bytes[0] = 0xc4;
3662 break;
3663 case VEX0F3A:
3664 m = 0x3;
3665 i.vex.bytes[0] = 0xc4;
3666 break;
3667 case XOP08:
3668 m = 0x8;
3669 i.vex.bytes[0] = 0x8f;
3670 break;
3671 case XOP09:
3672 m = 0x9;
3673 i.vex.bytes[0] = 0x8f;
3674 break;
3675 case XOP0A:
3676 m = 0xa;
3677 i.vex.bytes[0] = 0x8f;
3678 break;
3679 default:
3680 abort ();
3681 }
3682
3683 /* The high 3 bits of the second VEX byte are 1's compliment
3684 of RXB bits from REX. */
3685 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3686
3687 i.vex.bytes[2] = (w << 7
3688 | register_specifier << 3
3689 | vector_length << 2
3690 | implied_prefix);
3691 }
3692 }
3693
3694 static INLINE bfd_boolean
3695 is_evex_encoding (const insn_template *t)
3696 {
3697 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3698 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3699 || t->opcode_modifier.sae;
3700 }
3701
3702 static INLINE bfd_boolean
3703 is_any_vex_encoding (const insn_template *t)
3704 {
3705 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3706 || is_evex_encoding (t);
3707 }
3708
3709 /* Build the EVEX prefix. */
3710
3711 static void
3712 build_evex_prefix (void)
3713 {
3714 unsigned int register_specifier;
3715 unsigned int implied_prefix;
3716 unsigned int m, w;
3717 rex_byte vrex_used = 0;
3718
3719 /* Check register specifier. */
3720 if (i.vex.register_specifier)
3721 {
3722 gas_assert ((i.vrex & REX_X) == 0);
3723
3724 register_specifier = i.vex.register_specifier->reg_num;
3725 if ((i.vex.register_specifier->reg_flags & RegRex))
3726 register_specifier += 8;
3727 /* The upper 16 registers are encoded in the fourth byte of the
3728 EVEX prefix. */
3729 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3730 i.vex.bytes[3] = 0x8;
3731 register_specifier = ~register_specifier & 0xf;
3732 }
3733 else
3734 {
3735 register_specifier = 0xf;
3736
3737 /* Encode upper 16 vector index register in the fourth byte of
3738 the EVEX prefix. */
3739 if (!(i.vrex & REX_X))
3740 i.vex.bytes[3] = 0x8;
3741 else
3742 vrex_used |= REX_X;
3743 }
3744
3745 switch ((i.tm.base_opcode >> 8) & 0xff)
3746 {
3747 case 0:
3748 implied_prefix = 0;
3749 break;
3750 case DATA_PREFIX_OPCODE:
3751 implied_prefix = 1;
3752 break;
3753 case REPE_PREFIX_OPCODE:
3754 implied_prefix = 2;
3755 break;
3756 case REPNE_PREFIX_OPCODE:
3757 implied_prefix = 3;
3758 break;
3759 default:
3760 abort ();
3761 }
3762
3763 /* 4 byte EVEX prefix. */
3764 i.vex.length = 4;
3765 i.vex.bytes[0] = 0x62;
3766
3767 /* mmmm bits. */
3768 switch (i.tm.opcode_modifier.vexopcode)
3769 {
3770 case VEX0F:
3771 m = 1;
3772 break;
3773 case VEX0F38:
3774 m = 2;
3775 break;
3776 case VEX0F3A:
3777 m = 3;
3778 break;
3779 default:
3780 abort ();
3781 break;
3782 }
3783
3784 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3785 bits from REX. */
3786 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3787
3788 /* The fifth bit of the second EVEX byte is 1's compliment of the
3789 REX_R bit in VREX. */
3790 if (!(i.vrex & REX_R))
3791 i.vex.bytes[1] |= 0x10;
3792 else
3793 vrex_used |= REX_R;
3794
3795 if ((i.reg_operands + i.imm_operands) == i.operands)
3796 {
3797 /* When all operands are registers, the REX_X bit in REX is not
3798 used. We reuse it to encode the upper 16 registers, which is
3799 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3800 as 1's compliment. */
3801 if ((i.vrex & REX_B))
3802 {
3803 vrex_used |= REX_B;
3804 i.vex.bytes[1] &= ~0x40;
3805 }
3806 }
3807
3808 /* EVEX instructions shouldn't need the REX prefix. */
3809 i.vrex &= ~vrex_used;
3810 gas_assert (i.vrex == 0);
3811
3812 /* Check the REX.W bit and VEXW. */
3813 if (i.tm.opcode_modifier.vexw == VEXWIG)
3814 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3815 else if (i.tm.opcode_modifier.vexw)
3816 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3817 else
3818 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3819
3820 /* Encode the U bit. */
3821 implied_prefix |= 0x4;
3822
3823 /* The third byte of the EVEX prefix. */
3824 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3825
3826 /* The fourth byte of the EVEX prefix. */
3827 /* The zeroing-masking bit. */
3828 if (i.mask && i.mask->zeroing)
3829 i.vex.bytes[3] |= 0x80;
3830
3831 /* Don't always set the broadcast bit if there is no RC. */
3832 if (!i.rounding)
3833 {
3834 /* Encode the vector length. */
3835 unsigned int vec_length;
3836
3837 if (!i.tm.opcode_modifier.evex
3838 || i.tm.opcode_modifier.evex == EVEXDYN)
3839 {
3840 unsigned int op;
3841
3842 /* Determine vector length from the last multi-length vector
3843 operand. */
3844 vec_length = 0;
3845 for (op = i.operands; op--;)
3846 if (i.tm.operand_types[op].bitfield.xmmword
3847 + i.tm.operand_types[op].bitfield.ymmword
3848 + i.tm.operand_types[op].bitfield.zmmword > 1)
3849 {
3850 if (i.types[op].bitfield.zmmword)
3851 {
3852 i.tm.opcode_modifier.evex = EVEX512;
3853 break;
3854 }
3855 else if (i.types[op].bitfield.ymmword)
3856 {
3857 i.tm.opcode_modifier.evex = EVEX256;
3858 break;
3859 }
3860 else if (i.types[op].bitfield.xmmword)
3861 {
3862 i.tm.opcode_modifier.evex = EVEX128;
3863 break;
3864 }
3865 else if (i.broadcast && (int) op == i.broadcast->operand)
3866 {
3867 switch (i.broadcast->bytes)
3868 {
3869 case 64:
3870 i.tm.opcode_modifier.evex = EVEX512;
3871 break;
3872 case 32:
3873 i.tm.opcode_modifier.evex = EVEX256;
3874 break;
3875 case 16:
3876 i.tm.opcode_modifier.evex = EVEX128;
3877 break;
3878 default:
3879 abort ();
3880 }
3881 break;
3882 }
3883 }
3884
3885 if (op >= MAX_OPERANDS)
3886 abort ();
3887 }
3888
3889 switch (i.tm.opcode_modifier.evex)
3890 {
3891 case EVEXLIG: /* LL' is ignored */
3892 vec_length = evexlig << 5;
3893 break;
3894 case EVEX128:
3895 vec_length = 0 << 5;
3896 break;
3897 case EVEX256:
3898 vec_length = 1 << 5;
3899 break;
3900 case EVEX512:
3901 vec_length = 2 << 5;
3902 break;
3903 default:
3904 abort ();
3905 break;
3906 }
3907 i.vex.bytes[3] |= vec_length;
3908 /* Encode the broadcast bit. */
3909 if (i.broadcast)
3910 i.vex.bytes[3] |= 0x10;
3911 }
3912 else
3913 {
3914 if (i.rounding->type != saeonly)
3915 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3916 else
3917 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3918 }
3919
3920 if (i.mask && i.mask->mask)
3921 i.vex.bytes[3] |= i.mask->mask->reg_num;
3922 }
3923
3924 static void
3925 process_immext (void)
3926 {
3927 expressionS *exp;
3928
3929 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3930 which is coded in the same place as an 8-bit immediate field
3931 would be. Here we fake an 8-bit immediate operand from the
3932 opcode suffix stored in tm.extension_opcode.
3933
3934 AVX instructions also use this encoding, for some of
3935 3 argument instructions. */
3936
3937 gas_assert (i.imm_operands <= 1
3938 && (i.operands <= 2
3939 || (is_any_vex_encoding (&i.tm)
3940 && i.operands <= 4)));
3941
3942 exp = &im_expressions[i.imm_operands++];
3943 i.op[i.operands].imms = exp;
3944 i.types[i.operands] = imm8;
3945 i.operands++;
3946 exp->X_op = O_constant;
3947 exp->X_add_number = i.tm.extension_opcode;
3948 i.tm.extension_opcode = None;
3949 }
3950
3951
3952 static int
3953 check_hle (void)
3954 {
3955 switch (i.tm.opcode_modifier.hleprefixok)
3956 {
3957 default:
3958 abort ();
3959 case HLEPrefixNone:
3960 as_bad (_("invalid instruction `%s' after `%s'"),
3961 i.tm.name, i.hle_prefix);
3962 return 0;
3963 case HLEPrefixLock:
3964 if (i.prefix[LOCK_PREFIX])
3965 return 1;
3966 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3967 return 0;
3968 case HLEPrefixAny:
3969 return 1;
3970 case HLEPrefixRelease:
3971 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3972 {
3973 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3974 i.tm.name);
3975 return 0;
3976 }
3977 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3978 {
3979 as_bad (_("memory destination needed for instruction `%s'"
3980 " after `xrelease'"), i.tm.name);
3981 return 0;
3982 }
3983 return 1;
3984 }
3985 }
3986
3987 /* Try the shortest encoding by shortening operand size. */
3988
3989 static void
3990 optimize_encoding (void)
3991 {
3992 unsigned int j;
3993
3994 if (optimize_for_space
3995 && !is_any_vex_encoding (&i.tm)
3996 && i.reg_operands == 1
3997 && i.imm_operands == 1
3998 && !i.types[1].bitfield.byte
3999 && i.op[0].imms->X_op == O_constant
4000 && fits_in_imm7 (i.op[0].imms->X_add_number)
4001 && (i.tm.base_opcode == 0xa8
4002 || (i.tm.base_opcode == 0xf6
4003 && i.tm.extension_opcode == 0x0)))
4004 {
4005 /* Optimize: -Os:
4006 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4007 */
4008 unsigned int base_regnum = i.op[1].regs->reg_num;
4009 if (flag_code == CODE_64BIT || base_regnum < 4)
4010 {
4011 i.types[1].bitfield.byte = 1;
4012 /* Ignore the suffix. */
4013 i.suffix = 0;
4014 /* Convert to byte registers. */
4015 if (i.types[1].bitfield.word)
4016 j = 16;
4017 else if (i.types[1].bitfield.dword)
4018 j = 32;
4019 else
4020 j = 48;
4021 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4022 j += 8;
4023 i.op[1].regs -= j;
4024 }
4025 }
4026 else if (flag_code == CODE_64BIT
4027 && !is_any_vex_encoding (&i.tm)
4028 && ((i.types[1].bitfield.qword
4029 && i.reg_operands == 1
4030 && i.imm_operands == 1
4031 && i.op[0].imms->X_op == O_constant
4032 && ((i.tm.base_opcode == 0xb8
4033 && i.tm.extension_opcode == None
4034 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4035 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4036 && ((i.tm.base_opcode == 0x24
4037 || i.tm.base_opcode == 0xa8)
4038 || (i.tm.base_opcode == 0x80
4039 && i.tm.extension_opcode == 0x4)
4040 || ((i.tm.base_opcode == 0xf6
4041 || (i.tm.base_opcode | 1) == 0xc7)
4042 && i.tm.extension_opcode == 0x0)))
4043 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4044 && i.tm.base_opcode == 0x83
4045 && i.tm.extension_opcode == 0x4)))
4046 || (i.types[0].bitfield.qword
4047 && ((i.reg_operands == 2
4048 && i.op[0].regs == i.op[1].regs
4049 && (i.tm.base_opcode == 0x30
4050 || i.tm.base_opcode == 0x28))
4051 || (i.reg_operands == 1
4052 && i.operands == 1
4053 && i.tm.base_opcode == 0x30)))))
4054 {
4055 /* Optimize: -O:
4056 andq $imm31, %r64 -> andl $imm31, %r32
4057 andq $imm7, %r64 -> andl $imm7, %r32
4058 testq $imm31, %r64 -> testl $imm31, %r32
4059 xorq %r64, %r64 -> xorl %r32, %r32
4060 subq %r64, %r64 -> subl %r32, %r32
4061 movq $imm31, %r64 -> movl $imm31, %r32
4062 movq $imm32, %r64 -> movl $imm32, %r32
4063 */
4064 i.tm.opcode_modifier.norex64 = 1;
4065 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4066 {
4067 /* Handle
4068 movq $imm31, %r64 -> movl $imm31, %r32
4069 movq $imm32, %r64 -> movl $imm32, %r32
4070 */
4071 i.tm.operand_types[0].bitfield.imm32 = 1;
4072 i.tm.operand_types[0].bitfield.imm32s = 0;
4073 i.tm.operand_types[0].bitfield.imm64 = 0;
4074 i.types[0].bitfield.imm32 = 1;
4075 i.types[0].bitfield.imm32s = 0;
4076 i.types[0].bitfield.imm64 = 0;
4077 i.types[1].bitfield.dword = 1;
4078 i.types[1].bitfield.qword = 0;
4079 if ((i.tm.base_opcode | 1) == 0xc7)
4080 {
4081 /* Handle
4082 movq $imm31, %r64 -> movl $imm31, %r32
4083 */
4084 i.tm.base_opcode = 0xb8;
4085 i.tm.extension_opcode = None;
4086 i.tm.opcode_modifier.w = 0;
4087 i.tm.opcode_modifier.modrm = 0;
4088 }
4089 }
4090 }
4091 else if (optimize > 1
4092 && !optimize_for_space
4093 && !is_any_vex_encoding (&i.tm)
4094 && i.reg_operands == 2
4095 && i.op[0].regs == i.op[1].regs
4096 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4097 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4098 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4099 {
4100 /* Optimize: -O2:
4101 andb %rN, %rN -> testb %rN, %rN
4102 andw %rN, %rN -> testw %rN, %rN
4103 andq %rN, %rN -> testq %rN, %rN
4104 orb %rN, %rN -> testb %rN, %rN
4105 orw %rN, %rN -> testw %rN, %rN
4106 orq %rN, %rN -> testq %rN, %rN
4107
4108 and outside of 64-bit mode
4109
4110 andl %rN, %rN -> testl %rN, %rN
4111 orl %rN, %rN -> testl %rN, %rN
4112 */
4113 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4114 }
4115 else if (i.reg_operands == 3
4116 && i.op[0].regs == i.op[1].regs
4117 && !i.types[2].bitfield.xmmword
4118 && (i.tm.opcode_modifier.vex
4119 || ((!i.mask || i.mask->zeroing)
4120 && !i.rounding
4121 && is_evex_encoding (&i.tm)
4122 && (i.vec_encoding != vex_encoding_evex
4123 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4124 || i.tm.cpu_flags.bitfield.cpuavx512vl
4125 || (i.tm.operand_types[2].bitfield.zmmword
4126 && i.types[2].bitfield.ymmword))))
4127 && ((i.tm.base_opcode == 0x55
4128 || i.tm.base_opcode == 0x6655
4129 || i.tm.base_opcode == 0x66df
4130 || i.tm.base_opcode == 0x57
4131 || i.tm.base_opcode == 0x6657
4132 || i.tm.base_opcode == 0x66ef
4133 || i.tm.base_opcode == 0x66f8
4134 || i.tm.base_opcode == 0x66f9
4135 || i.tm.base_opcode == 0x66fa
4136 || i.tm.base_opcode == 0x66fb
4137 || i.tm.base_opcode == 0x42
4138 || i.tm.base_opcode == 0x6642
4139 || i.tm.base_opcode == 0x47
4140 || i.tm.base_opcode == 0x6647)
4141 && i.tm.extension_opcode == None))
4142 {
4143 /* Optimize: -O1:
4144 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4145 vpsubq and vpsubw:
4146 EVEX VOP %zmmM, %zmmM, %zmmN
4147 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4148 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4149 EVEX VOP %ymmM, %ymmM, %ymmN
4150 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4151 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4152 VEX VOP %ymmM, %ymmM, %ymmN
4153 -> VEX VOP %xmmM, %xmmM, %xmmN
4154 VOP, one of vpandn and vpxor:
4155 VEX VOP %ymmM, %ymmM, %ymmN
4156 -> VEX VOP %xmmM, %xmmM, %xmmN
4157 VOP, one of vpandnd and vpandnq:
4158 EVEX VOP %zmmM, %zmmM, %zmmN
4159 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4160 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4161 EVEX VOP %ymmM, %ymmM, %ymmN
4162 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4163 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4164 VOP, one of vpxord and vpxorq:
4165 EVEX VOP %zmmM, %zmmM, %zmmN
4166 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4167 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4168 EVEX VOP %ymmM, %ymmM, %ymmN
4169 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4170 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4171 VOP, one of kxord and kxorq:
4172 VEX VOP %kM, %kM, %kN
4173 -> VEX kxorw %kM, %kM, %kN
4174 VOP, one of kandnd and kandnq:
4175 VEX VOP %kM, %kM, %kN
4176 -> VEX kandnw %kM, %kM, %kN
4177 */
4178 if (is_evex_encoding (&i.tm))
4179 {
4180 if (i.vec_encoding != vex_encoding_evex)
4181 {
4182 i.tm.opcode_modifier.vex = VEX128;
4183 i.tm.opcode_modifier.vexw = VEXW0;
4184 i.tm.opcode_modifier.evex = 0;
4185 }
4186 else if (optimize > 1)
4187 i.tm.opcode_modifier.evex = EVEX128;
4188 else
4189 return;
4190 }
4191 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4192 {
4193 i.tm.base_opcode &= 0xff;
4194 i.tm.opcode_modifier.vexw = VEXW0;
4195 }
4196 else
4197 i.tm.opcode_modifier.vex = VEX128;
4198
4199 if (i.tm.opcode_modifier.vex)
4200 for (j = 0; j < 3; j++)
4201 {
4202 i.types[j].bitfield.xmmword = 1;
4203 i.types[j].bitfield.ymmword = 0;
4204 }
4205 }
4206 else if (i.vec_encoding != vex_encoding_evex
4207 && !i.types[0].bitfield.zmmword
4208 && !i.types[1].bitfield.zmmword
4209 && !i.mask
4210 && !i.broadcast
4211 && is_evex_encoding (&i.tm)
4212 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4213 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4214 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4215 || (i.tm.base_opcode & ~4) == 0x66db
4216 || (i.tm.base_opcode & ~4) == 0x66eb)
4217 && i.tm.extension_opcode == None)
4218 {
4219 /* Optimize: -O1:
4220 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4221 vmovdqu32 and vmovdqu64:
4222 EVEX VOP %xmmM, %xmmN
4223 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4224 EVEX VOP %ymmM, %ymmN
4225 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4226 EVEX VOP %xmmM, mem
4227 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4228 EVEX VOP %ymmM, mem
4229 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4230 EVEX VOP mem, %xmmN
4231 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4232 EVEX VOP mem, %ymmN
4233 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4234 VOP, one of vpand, vpandn, vpor, vpxor:
4235 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4236 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4237 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4238 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4239 EVEX VOP{d,q} mem, %xmmM, %xmmN
4240 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4241 EVEX VOP{d,q} mem, %ymmM, %ymmN
4242 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4243 */
4244 for (j = 0; j < i.operands; j++)
4245 if (operand_type_check (i.types[j], disp)
4246 && i.op[j].disps->X_op == O_constant)
4247 {
4248 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4249 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4250 bytes, we choose EVEX Disp8 over VEX Disp32. */
4251 int evex_disp8, vex_disp8;
4252 unsigned int memshift = i.memshift;
4253 offsetT n = i.op[j].disps->X_add_number;
4254
4255 evex_disp8 = fits_in_disp8 (n);
4256 i.memshift = 0;
4257 vex_disp8 = fits_in_disp8 (n);
4258 if (evex_disp8 != vex_disp8)
4259 {
4260 i.memshift = memshift;
4261 return;
4262 }
4263
4264 i.types[j].bitfield.disp8 = vex_disp8;
4265 break;
4266 }
4267 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4268 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4269 i.tm.opcode_modifier.vex
4270 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4271 i.tm.opcode_modifier.vexw = VEXW0;
4272 /* VPAND, VPOR, and VPXOR are commutative. */
4273 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4274 i.tm.opcode_modifier.commutative = 1;
4275 i.tm.opcode_modifier.evex = 0;
4276 i.tm.opcode_modifier.masking = 0;
4277 i.tm.opcode_modifier.broadcast = 0;
4278 i.tm.opcode_modifier.disp8memshift = 0;
4279 i.memshift = 0;
4280 if (j < i.operands)
4281 i.types[j].bitfield.disp8
4282 = fits_in_disp8 (i.op[j].disps->X_add_number);
4283 }
4284 }
4285
4286 /* This is the guts of the machine-dependent assembler. LINE points to a
4287 machine dependent instruction. This function is supposed to emit
4288 the frags/bytes it assembles to. */
4289
4290 void
4291 md_assemble (char *line)
4292 {
4293 unsigned int j;
4294 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4295 const insn_template *t;
4296
4297 /* Initialize globals. */
4298 memset (&i, '\0', sizeof (i));
4299 for (j = 0; j < MAX_OPERANDS; j++)
4300 i.reloc[j] = NO_RELOC;
4301 memset (disp_expressions, '\0', sizeof (disp_expressions));
4302 memset (im_expressions, '\0', sizeof (im_expressions));
4303 save_stack_p = save_stack;
4304
4305 /* First parse an instruction mnemonic & call i386_operand for the operands.
4306 We assume that the scrubber has arranged it so that line[0] is the valid
4307 start of a (possibly prefixed) mnemonic. */
4308
4309 line = parse_insn (line, mnemonic);
4310 if (line == NULL)
4311 return;
4312 mnem_suffix = i.suffix;
4313
4314 line = parse_operands (line, mnemonic);
4315 this_operand = -1;
4316 xfree (i.memop1_string);
4317 i.memop1_string = NULL;
4318 if (line == NULL)
4319 return;
4320
4321 /* Now we've parsed the mnemonic into a set of templates, and have the
4322 operands at hand. */
4323
4324 /* All intel opcodes have reversed operands except for "bound" and
4325 "enter". We also don't reverse intersegment "jmp" and "call"
4326 instructions with 2 immediate operands so that the immediate segment
4327 precedes the offset, as it does when in AT&T mode. */
4328 if (intel_syntax
4329 && i.operands > 1
4330 && (strcmp (mnemonic, "bound") != 0)
4331 && (strcmp (mnemonic, "invlpga") != 0)
4332 && !(operand_type_check (i.types[0], imm)
4333 && operand_type_check (i.types[1], imm)))
4334 swap_operands ();
4335
4336 /* The order of the immediates should be reversed
4337 for 2 immediates extrq and insertq instructions */
4338 if (i.imm_operands == 2
4339 && (strcmp (mnemonic, "extrq") == 0
4340 || strcmp (mnemonic, "insertq") == 0))
4341 swap_2_operands (0, 1);
4342
4343 if (i.imm_operands)
4344 optimize_imm ();
4345
4346 /* Don't optimize displacement for movabs since it only takes 64bit
4347 displacement. */
4348 if (i.disp_operands
4349 && i.disp_encoding != disp_encoding_32bit
4350 && (flag_code != CODE_64BIT
4351 || strcmp (mnemonic, "movabs") != 0))
4352 optimize_disp ();
4353
4354 /* Next, we find a template that matches the given insn,
4355 making sure the overlap of the given operands types is consistent
4356 with the template operand types. */
4357
4358 if (!(t = match_template (mnem_suffix)))
4359 return;
4360
4361 if (sse_check != check_none
4362 && !i.tm.opcode_modifier.noavx
4363 && !i.tm.cpu_flags.bitfield.cpuavx
4364 && !i.tm.cpu_flags.bitfield.cpuavx512f
4365 && (i.tm.cpu_flags.bitfield.cpusse
4366 || i.tm.cpu_flags.bitfield.cpusse2
4367 || i.tm.cpu_flags.bitfield.cpusse3
4368 || i.tm.cpu_flags.bitfield.cpussse3
4369 || i.tm.cpu_flags.bitfield.cpusse4_1
4370 || i.tm.cpu_flags.bitfield.cpusse4_2
4371 || i.tm.cpu_flags.bitfield.cpusse4a
4372 || i.tm.cpu_flags.bitfield.cpupclmul
4373 || i.tm.cpu_flags.bitfield.cpuaes
4374 || i.tm.cpu_flags.bitfield.cpusha
4375 || i.tm.cpu_flags.bitfield.cpugfni))
4376 {
4377 (sse_check == check_warning
4378 ? as_warn
4379 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4380 }
4381
4382 /* Zap movzx and movsx suffix. The suffix has been set from
4383 "word ptr" or "byte ptr" on the source operand in Intel syntax
4384 or extracted from mnemonic in AT&T syntax. But we'll use
4385 the destination register to choose the suffix for encoding. */
4386 if ((i.tm.base_opcode & ~9) == 0x0fb6)
4387 {
4388 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
4389 there is no suffix, the default will be byte extension. */
4390 if (i.reg_operands != 2
4391 && !i.suffix
4392 && intel_syntax)
4393 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4394
4395 i.suffix = 0;
4396 }
4397
4398 if (i.tm.opcode_modifier.fwait)
4399 if (!add_prefix (FWAIT_OPCODE))
4400 return;
4401
4402 /* Check if REP prefix is OK. */
4403 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4404 {
4405 as_bad (_("invalid instruction `%s' after `%s'"),
4406 i.tm.name, i.rep_prefix);
4407 return;
4408 }
4409
4410 /* Check for lock without a lockable instruction. Destination operand
4411 must be memory unless it is xchg (0x86). */
4412 if (i.prefix[LOCK_PREFIX]
4413 && (!i.tm.opcode_modifier.islockable
4414 || i.mem_operands == 0
4415 || (i.tm.base_opcode != 0x86
4416 && !(i.flags[i.operands - 1] & Operand_Mem))))
4417 {
4418 as_bad (_("expecting lockable instruction after `lock'"));
4419 return;
4420 }
4421
4422 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4423 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4424 {
4425 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4426 return;
4427 }
4428
4429 /* Check if HLE prefix is OK. */
4430 if (i.hle_prefix && !check_hle ())
4431 return;
4432
4433 /* Check BND prefix. */
4434 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4435 as_bad (_("expecting valid branch instruction after `bnd'"));
4436
4437 /* Check NOTRACK prefix. */
4438 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4439 as_bad (_("expecting indirect branch instruction after `notrack'"));
4440
4441 if (i.tm.cpu_flags.bitfield.cpumpx)
4442 {
4443 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4444 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4445 else if (flag_code != CODE_16BIT
4446 ? i.prefix[ADDR_PREFIX]
4447 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4448 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4449 }
4450
4451 /* Insert BND prefix. */
4452 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4453 {
4454 if (!i.prefix[BND_PREFIX])
4455 add_prefix (BND_PREFIX_OPCODE);
4456 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4457 {
4458 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4459 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4460 }
4461 }
4462
4463 /* Check string instruction segment overrides. */
4464 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4465 {
4466 gas_assert (i.mem_operands);
4467 if (!check_string ())
4468 return;
4469 i.disp_operands = 0;
4470 }
4471
4472 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4473 optimize_encoding ();
4474
4475 if (!process_suffix ())
4476 return;
4477
4478 /* Update operand types. */
4479 for (j = 0; j < i.operands; j++)
4480 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4481
4482 /* Make still unresolved immediate matches conform to size of immediate
4483 given in i.suffix. */
4484 if (!finalize_imm ())
4485 return;
4486
4487 if (i.types[0].bitfield.imm1)
4488 i.imm_operands = 0; /* kludge for shift insns. */
4489
4490 /* We only need to check those implicit registers for instructions
4491 with 3 operands or less. */
4492 if (i.operands <= 3)
4493 for (j = 0; j < i.operands; j++)
4494 if (i.types[j].bitfield.instance != InstanceNone
4495 && !i.types[j].bitfield.xmmword)
4496 i.reg_operands--;
4497
4498 /* ImmExt should be processed after SSE2AVX. */
4499 if (!i.tm.opcode_modifier.sse2avx
4500 && i.tm.opcode_modifier.immext)
4501 process_immext ();
4502
4503 /* For insns with operands there are more diddles to do to the opcode. */
4504 if (i.operands)
4505 {
4506 if (!process_operands ())
4507 return;
4508 }
4509 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4510 {
4511 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4512 as_warn (_("translating to `%sp'"), i.tm.name);
4513 }
4514
4515 if (is_any_vex_encoding (&i.tm))
4516 {
4517 if (!cpu_arch_flags.bitfield.cpui286)
4518 {
4519 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4520 i.tm.name);
4521 return;
4522 }
4523
4524 if (i.tm.opcode_modifier.vex)
4525 build_vex_prefix (t);
4526 else
4527 build_evex_prefix ();
4528 }
4529
4530 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4531 instructions may define INT_OPCODE as well, so avoid this corner
4532 case for those instructions that use MODRM. */
4533 if (i.tm.base_opcode == INT_OPCODE
4534 && !i.tm.opcode_modifier.modrm
4535 && i.op[0].imms->X_add_number == 3)
4536 {
4537 i.tm.base_opcode = INT3_OPCODE;
4538 i.imm_operands = 0;
4539 }
4540
4541 if ((i.tm.opcode_modifier.jump == JUMP
4542 || i.tm.opcode_modifier.jump == JUMP_BYTE
4543 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4544 && i.op[0].disps->X_op == O_constant)
4545 {
4546 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4547 the absolute address given by the constant. Since ix86 jumps and
4548 calls are pc relative, we need to generate a reloc. */
4549 i.op[0].disps->X_add_symbol = &abs_symbol;
4550 i.op[0].disps->X_op = O_symbol;
4551 }
4552
4553 if (i.tm.opcode_modifier.rex64)
4554 i.rex |= REX_W;
4555
4556 /* For 8 bit registers we need an empty rex prefix. Also if the
4557 instruction already has a prefix, we need to convert old
4558 registers to new ones. */
4559
4560 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4561 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4562 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4563 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4564 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4565 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4566 && i.rex != 0))
4567 {
4568 int x;
4569
4570 i.rex |= REX_OPCODE;
4571 for (x = 0; x < 2; x++)
4572 {
4573 /* Look for 8 bit operand that uses old registers. */
4574 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4575 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4576 {
4577 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4578 /* In case it is "hi" register, give up. */
4579 if (i.op[x].regs->reg_num > 3)
4580 as_bad (_("can't encode register '%s%s' in an "
4581 "instruction requiring REX prefix."),
4582 register_prefix, i.op[x].regs->reg_name);
4583
4584 /* Otherwise it is equivalent to the extended register.
4585 Since the encoding doesn't change this is merely
4586 cosmetic cleanup for debug output. */
4587
4588 i.op[x].regs = i.op[x].regs + 8;
4589 }
4590 }
4591 }
4592
4593 if (i.rex == 0 && i.rex_encoding)
4594 {
4595 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4596 that uses legacy register. If it is "hi" register, don't add
4597 the REX_OPCODE byte. */
4598 int x;
4599 for (x = 0; x < 2; x++)
4600 if (i.types[x].bitfield.class == Reg
4601 && i.types[x].bitfield.byte
4602 && (i.op[x].regs->reg_flags & RegRex64) == 0
4603 && i.op[x].regs->reg_num > 3)
4604 {
4605 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4606 i.rex_encoding = FALSE;
4607 break;
4608 }
4609
4610 if (i.rex_encoding)
4611 i.rex = REX_OPCODE;
4612 }
4613
4614 if (i.rex != 0)
4615 add_prefix (REX_OPCODE | i.rex);
4616
4617 /* We are ready to output the insn. */
4618 output_insn ();
4619
4620 last_insn.seg = now_seg;
4621
4622 if (i.tm.opcode_modifier.isprefix)
4623 {
4624 last_insn.kind = last_insn_prefix;
4625 last_insn.name = i.tm.name;
4626 last_insn.file = as_where (&last_insn.line);
4627 }
4628 else
4629 last_insn.kind = last_insn_other;
4630 }
4631
4632 static char *
4633 parse_insn (char *line, char *mnemonic)
4634 {
4635 char *l = line;
4636 char *token_start = l;
4637 char *mnem_p;
4638 int supported;
4639 const insn_template *t;
4640 char *dot_p = NULL;
4641
4642 while (1)
4643 {
4644 mnem_p = mnemonic;
4645 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4646 {
4647 if (*mnem_p == '.')
4648 dot_p = mnem_p;
4649 mnem_p++;
4650 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4651 {
4652 as_bad (_("no such instruction: `%s'"), token_start);
4653 return NULL;
4654 }
4655 l++;
4656 }
4657 if (!is_space_char (*l)
4658 && *l != END_OF_INSN
4659 && (intel_syntax
4660 || (*l != PREFIX_SEPARATOR
4661 && *l != ',')))
4662 {
4663 as_bad (_("invalid character %s in mnemonic"),
4664 output_invalid (*l));
4665 return NULL;
4666 }
4667 if (token_start == l)
4668 {
4669 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4670 as_bad (_("expecting prefix; got nothing"));
4671 else
4672 as_bad (_("expecting mnemonic; got nothing"));
4673 return NULL;
4674 }
4675
4676 /* Look up instruction (or prefix) via hash table. */
4677 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4678
4679 if (*l != END_OF_INSN
4680 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4681 && current_templates
4682 && current_templates->start->opcode_modifier.isprefix)
4683 {
4684 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4685 {
4686 as_bad ((flag_code != CODE_64BIT
4687 ? _("`%s' is only supported in 64-bit mode")
4688 : _("`%s' is not supported in 64-bit mode")),
4689 current_templates->start->name);
4690 return NULL;
4691 }
4692 /* If we are in 16-bit mode, do not allow addr16 or data16.
4693 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4694 if ((current_templates->start->opcode_modifier.size == SIZE16
4695 || current_templates->start->opcode_modifier.size == SIZE32)
4696 && flag_code != CODE_64BIT
4697 && ((current_templates->start->opcode_modifier.size == SIZE32)
4698 ^ (flag_code == CODE_16BIT)))
4699 {
4700 as_bad (_("redundant %s prefix"),
4701 current_templates->start->name);
4702 return NULL;
4703 }
4704 if (current_templates->start->opcode_length == 0)
4705 {
4706 /* Handle pseudo prefixes. */
4707 switch (current_templates->start->base_opcode)
4708 {
4709 case 0x0:
4710 /* {disp8} */
4711 i.disp_encoding = disp_encoding_8bit;
4712 break;
4713 case 0x1:
4714 /* {disp32} */
4715 i.disp_encoding = disp_encoding_32bit;
4716 break;
4717 case 0x2:
4718 /* {load} */
4719 i.dir_encoding = dir_encoding_load;
4720 break;
4721 case 0x3:
4722 /* {store} */
4723 i.dir_encoding = dir_encoding_store;
4724 break;
4725 case 0x4:
4726 /* {vex} */
4727 i.vec_encoding = vex_encoding_vex;
4728 break;
4729 case 0x5:
4730 /* {vex3} */
4731 i.vec_encoding = vex_encoding_vex3;
4732 break;
4733 case 0x6:
4734 /* {evex} */
4735 i.vec_encoding = vex_encoding_evex;
4736 break;
4737 case 0x7:
4738 /* {rex} */
4739 i.rex_encoding = TRUE;
4740 break;
4741 case 0x8:
4742 /* {nooptimize} */
4743 i.no_optimize = TRUE;
4744 break;
4745 default:
4746 abort ();
4747 }
4748 }
4749 else
4750 {
4751 /* Add prefix, checking for repeated prefixes. */
4752 switch (add_prefix (current_templates->start->base_opcode))
4753 {
4754 case PREFIX_EXIST:
4755 return NULL;
4756 case PREFIX_DS:
4757 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4758 i.notrack_prefix = current_templates->start->name;
4759 break;
4760 case PREFIX_REP:
4761 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4762 i.hle_prefix = current_templates->start->name;
4763 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4764 i.bnd_prefix = current_templates->start->name;
4765 else
4766 i.rep_prefix = current_templates->start->name;
4767 break;
4768 default:
4769 break;
4770 }
4771 }
4772 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4773 token_start = ++l;
4774 }
4775 else
4776 break;
4777 }
4778
4779 if (!current_templates)
4780 {
4781 /* Deprecated functionality (new code should use pseudo-prefixes instead):
4782 Check if we should swap operand or force 32bit displacement in
4783 encoding. */
4784 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4785 i.dir_encoding = dir_encoding_swap;
4786 else if (mnem_p - 3 == dot_p
4787 && dot_p[1] == 'd'
4788 && dot_p[2] == '8')
4789 i.disp_encoding = disp_encoding_8bit;
4790 else if (mnem_p - 4 == dot_p
4791 && dot_p[1] == 'd'
4792 && dot_p[2] == '3'
4793 && dot_p[3] == '2')
4794 i.disp_encoding = disp_encoding_32bit;
4795 else
4796 goto check_suffix;
4797 mnem_p = dot_p;
4798 *dot_p = '\0';
4799 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4800 }
4801
4802 if (!current_templates)
4803 {
4804 check_suffix:
4805 if (mnem_p > mnemonic)
4806 {
4807 /* See if we can get a match by trimming off a suffix. */
4808 switch (mnem_p[-1])
4809 {
4810 case WORD_MNEM_SUFFIX:
4811 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4812 i.suffix = SHORT_MNEM_SUFFIX;
4813 else
4814 /* Fall through. */
4815 case BYTE_MNEM_SUFFIX:
4816 case QWORD_MNEM_SUFFIX:
4817 i.suffix = mnem_p[-1];
4818 mnem_p[-1] = '\0';
4819 current_templates = (const templates *) hash_find (op_hash,
4820 mnemonic);
4821 break;
4822 case SHORT_MNEM_SUFFIX:
4823 case LONG_MNEM_SUFFIX:
4824 if (!intel_syntax)
4825 {
4826 i.suffix = mnem_p[-1];
4827 mnem_p[-1] = '\0';
4828 current_templates = (const templates *) hash_find (op_hash,
4829 mnemonic);
4830 }
4831 break;
4832
4833 /* Intel Syntax. */
4834 case 'd':
4835 if (intel_syntax)
4836 {
4837 if (intel_float_operand (mnemonic) == 1)
4838 i.suffix = SHORT_MNEM_SUFFIX;
4839 else
4840 i.suffix = LONG_MNEM_SUFFIX;
4841 mnem_p[-1] = '\0';
4842 current_templates = (const templates *) hash_find (op_hash,
4843 mnemonic);
4844 }
4845 break;
4846 }
4847 }
4848
4849 if (!current_templates)
4850 {
4851 as_bad (_("no such instruction: `%s'"), token_start);
4852 return NULL;
4853 }
4854 }
4855
4856 if (current_templates->start->opcode_modifier.jump == JUMP
4857 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
4858 {
4859 /* Check for a branch hint. We allow ",pt" and ",pn" for
4860 predict taken and predict not taken respectively.
4861 I'm not sure that branch hints actually do anything on loop
4862 and jcxz insns (JumpByte) for current Pentium4 chips. They
4863 may work in the future and it doesn't hurt to accept them
4864 now. */
4865 if (l[0] == ',' && l[1] == 'p')
4866 {
4867 if (l[2] == 't')
4868 {
4869 if (!add_prefix (DS_PREFIX_OPCODE))
4870 return NULL;
4871 l += 3;
4872 }
4873 else if (l[2] == 'n')
4874 {
4875 if (!add_prefix (CS_PREFIX_OPCODE))
4876 return NULL;
4877 l += 3;
4878 }
4879 }
4880 }
4881 /* Any other comma loses. */
4882 if (*l == ',')
4883 {
4884 as_bad (_("invalid character %s in mnemonic"),
4885 output_invalid (*l));
4886 return NULL;
4887 }
4888
4889 /* Check if instruction is supported on specified architecture. */
4890 supported = 0;
4891 for (t = current_templates->start; t < current_templates->end; ++t)
4892 {
4893 supported |= cpu_flags_match (t);
4894 if (supported == CPU_FLAGS_PERFECT_MATCH)
4895 {
4896 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4897 as_warn (_("use .code16 to ensure correct addressing mode"));
4898
4899 return l;
4900 }
4901 }
4902
4903 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4904 as_bad (flag_code == CODE_64BIT
4905 ? _("`%s' is not supported in 64-bit mode")
4906 : _("`%s' is only supported in 64-bit mode"),
4907 current_templates->start->name);
4908 else
4909 as_bad (_("`%s' is not supported on `%s%s'"),
4910 current_templates->start->name,
4911 cpu_arch_name ? cpu_arch_name : default_arch,
4912 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4913
4914 return NULL;
4915 }
4916
4917 static char *
4918 parse_operands (char *l, const char *mnemonic)
4919 {
4920 char *token_start;
4921
4922 /* 1 if operand is pending after ','. */
4923 unsigned int expecting_operand = 0;
4924
4925 /* Non-zero if operand parens not balanced. */
4926 unsigned int paren_not_balanced;
4927
4928 while (*l != END_OF_INSN)
4929 {
4930 /* Skip optional white space before operand. */
4931 if (is_space_char (*l))
4932 ++l;
4933 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4934 {
4935 as_bad (_("invalid character %s before operand %d"),
4936 output_invalid (*l),
4937 i.operands + 1);
4938 return NULL;
4939 }
4940 token_start = l; /* After white space. */
4941 paren_not_balanced = 0;
4942 while (paren_not_balanced || *l != ',')
4943 {
4944 if (*l == END_OF_INSN)
4945 {
4946 if (paren_not_balanced)
4947 {
4948 if (!intel_syntax)
4949 as_bad (_("unbalanced parenthesis in operand %d."),
4950 i.operands + 1);
4951 else
4952 as_bad (_("unbalanced brackets in operand %d."),
4953 i.operands + 1);
4954 return NULL;
4955 }
4956 else
4957 break; /* we are done */
4958 }
4959 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4960 {
4961 as_bad (_("invalid character %s in operand %d"),
4962 output_invalid (*l),
4963 i.operands + 1);
4964 return NULL;
4965 }
4966 if (!intel_syntax)
4967 {
4968 if (*l == '(')
4969 ++paren_not_balanced;
4970 if (*l == ')')
4971 --paren_not_balanced;
4972 }
4973 else
4974 {
4975 if (*l == '[')
4976 ++paren_not_balanced;
4977 if (*l == ']')
4978 --paren_not_balanced;
4979 }
4980 l++;
4981 }
4982 if (l != token_start)
4983 { /* Yes, we've read in another operand. */
4984 unsigned int operand_ok;
4985 this_operand = i.operands++;
4986 if (i.operands > MAX_OPERANDS)
4987 {
4988 as_bad (_("spurious operands; (%d operands/instruction max)"),
4989 MAX_OPERANDS);
4990 return NULL;
4991 }
4992 i.types[this_operand].bitfield.unspecified = 1;
4993 /* Now parse operand adding info to 'i' as we go along. */
4994 END_STRING_AND_SAVE (l);
4995
4996 if (i.mem_operands > 1)
4997 {
4998 as_bad (_("too many memory references for `%s'"),
4999 mnemonic);
5000 return 0;
5001 }
5002
5003 if (intel_syntax)
5004 operand_ok =
5005 i386_intel_operand (token_start,
5006 intel_float_operand (mnemonic));
5007 else
5008 operand_ok = i386_att_operand (token_start);
5009
5010 RESTORE_END_STRING (l);
5011 if (!operand_ok)
5012 return NULL;
5013 }
5014 else
5015 {
5016 if (expecting_operand)
5017 {
5018 expecting_operand_after_comma:
5019 as_bad (_("expecting operand after ','; got nothing"));
5020 return NULL;
5021 }
5022 if (*l == ',')
5023 {
5024 as_bad (_("expecting operand before ','; got nothing"));
5025 return NULL;
5026 }
5027 }
5028
5029 /* Now *l must be either ',' or END_OF_INSN. */
5030 if (*l == ',')
5031 {
5032 if (*++l == END_OF_INSN)
5033 {
5034 /* Just skip it, if it's \n complain. */
5035 goto expecting_operand_after_comma;
5036 }
5037 expecting_operand = 1;
5038 }
5039 }
5040 return l;
5041 }
5042
5043 static void
5044 swap_2_operands (int xchg1, int xchg2)
5045 {
5046 union i386_op temp_op;
5047 i386_operand_type temp_type;
5048 unsigned int temp_flags;
5049 enum bfd_reloc_code_real temp_reloc;
5050
5051 temp_type = i.types[xchg2];
5052 i.types[xchg2] = i.types[xchg1];
5053 i.types[xchg1] = temp_type;
5054
5055 temp_flags = i.flags[xchg2];
5056 i.flags[xchg2] = i.flags[xchg1];
5057 i.flags[xchg1] = temp_flags;
5058
5059 temp_op = i.op[xchg2];
5060 i.op[xchg2] = i.op[xchg1];
5061 i.op[xchg1] = temp_op;
5062
5063 temp_reloc = i.reloc[xchg2];
5064 i.reloc[xchg2] = i.reloc[xchg1];
5065 i.reloc[xchg1] = temp_reloc;
5066
5067 if (i.mask)
5068 {
5069 if (i.mask->operand == xchg1)
5070 i.mask->operand = xchg2;
5071 else if (i.mask->operand == xchg2)
5072 i.mask->operand = xchg1;
5073 }
5074 if (i.broadcast)
5075 {
5076 if (i.broadcast->operand == xchg1)
5077 i.broadcast->operand = xchg2;
5078 else if (i.broadcast->operand == xchg2)
5079 i.broadcast->operand = xchg1;
5080 }
5081 if (i.rounding)
5082 {
5083 if (i.rounding->operand == xchg1)
5084 i.rounding->operand = xchg2;
5085 else if (i.rounding->operand == xchg2)
5086 i.rounding->operand = xchg1;
5087 }
5088 }
5089
5090 static void
5091 swap_operands (void)
5092 {
5093 switch (i.operands)
5094 {
5095 case 5:
5096 case 4:
5097 swap_2_operands (1, i.operands - 2);
5098 /* Fall through. */
5099 case 3:
5100 case 2:
5101 swap_2_operands (0, i.operands - 1);
5102 break;
5103 default:
5104 abort ();
5105 }
5106
5107 if (i.mem_operands == 2)
5108 {
5109 const seg_entry *temp_seg;
5110 temp_seg = i.seg[0];
5111 i.seg[0] = i.seg[1];
5112 i.seg[1] = temp_seg;
5113 }
5114 }
5115
5116 /* Try to ensure constant immediates are represented in the smallest
5117 opcode possible. */
5118 static void
5119 optimize_imm (void)
5120 {
5121 char guess_suffix = 0;
5122 int op;
5123
5124 if (i.suffix)
5125 guess_suffix = i.suffix;
5126 else if (i.reg_operands)
5127 {
5128 /* Figure out a suffix from the last register operand specified.
5129 We can't do this properly yet, i.e. excluding special register
5130 instances, but the following works for instructions with
5131 immediates. In any case, we can't set i.suffix yet. */
5132 for (op = i.operands; --op >= 0;)
5133 if (i.types[op].bitfield.class != Reg)
5134 continue;
5135 else if (i.types[op].bitfield.byte)
5136 {
5137 guess_suffix = BYTE_MNEM_SUFFIX;
5138 break;
5139 }
5140 else if (i.types[op].bitfield.word)
5141 {
5142 guess_suffix = WORD_MNEM_SUFFIX;
5143 break;
5144 }
5145 else if (i.types[op].bitfield.dword)
5146 {
5147 guess_suffix = LONG_MNEM_SUFFIX;
5148 break;
5149 }
5150 else if (i.types[op].bitfield.qword)
5151 {
5152 guess_suffix = QWORD_MNEM_SUFFIX;
5153 break;
5154 }
5155 }
5156 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5157 guess_suffix = WORD_MNEM_SUFFIX;
5158
5159 for (op = i.operands; --op >= 0;)
5160 if (operand_type_check (i.types[op], imm))
5161 {
5162 switch (i.op[op].imms->X_op)
5163 {
5164 case O_constant:
5165 /* If a suffix is given, this operand may be shortened. */
5166 switch (guess_suffix)
5167 {
5168 case LONG_MNEM_SUFFIX:
5169 i.types[op].bitfield.imm32 = 1;
5170 i.types[op].bitfield.imm64 = 1;
5171 break;
5172 case WORD_MNEM_SUFFIX:
5173 i.types[op].bitfield.imm16 = 1;
5174 i.types[op].bitfield.imm32 = 1;
5175 i.types[op].bitfield.imm32s = 1;
5176 i.types[op].bitfield.imm64 = 1;
5177 break;
5178 case BYTE_MNEM_SUFFIX:
5179 i.types[op].bitfield.imm8 = 1;
5180 i.types[op].bitfield.imm8s = 1;
5181 i.types[op].bitfield.imm16 = 1;
5182 i.types[op].bitfield.imm32 = 1;
5183 i.types[op].bitfield.imm32s = 1;
5184 i.types[op].bitfield.imm64 = 1;
5185 break;
5186 }
5187
5188 /* If this operand is at most 16 bits, convert it
5189 to a signed 16 bit number before trying to see
5190 whether it will fit in an even smaller size.
5191 This allows a 16-bit operand such as $0xffe0 to
5192 be recognised as within Imm8S range. */
5193 if ((i.types[op].bitfield.imm16)
5194 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5195 {
5196 i.op[op].imms->X_add_number =
5197 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5198 }
5199 #ifdef BFD64
5200 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5201 if ((i.types[op].bitfield.imm32)
5202 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5203 == 0))
5204 {
5205 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5206 ^ ((offsetT) 1 << 31))
5207 - ((offsetT) 1 << 31));
5208 }
5209 #endif
5210 i.types[op]
5211 = operand_type_or (i.types[op],
5212 smallest_imm_type (i.op[op].imms->X_add_number));
5213
5214 /* We must avoid matching of Imm32 templates when 64bit
5215 only immediate is available. */
5216 if (guess_suffix == QWORD_MNEM_SUFFIX)
5217 i.types[op].bitfield.imm32 = 0;
5218 break;
5219
5220 case O_absent:
5221 case O_register:
5222 abort ();
5223
5224 /* Symbols and expressions. */
5225 default:
5226 /* Convert symbolic operand to proper sizes for matching, but don't
5227 prevent matching a set of insns that only supports sizes other
5228 than those matching the insn suffix. */
5229 {
5230 i386_operand_type mask, allowed;
5231 const insn_template *t;
5232
5233 operand_type_set (&mask, 0);
5234 operand_type_set (&allowed, 0);
5235
5236 for (t = current_templates->start;
5237 t < current_templates->end;
5238 ++t)
5239 {
5240 allowed = operand_type_or (allowed, t->operand_types[op]);
5241 allowed = operand_type_and (allowed, anyimm);
5242 }
5243 switch (guess_suffix)
5244 {
5245 case QWORD_MNEM_SUFFIX:
5246 mask.bitfield.imm64 = 1;
5247 mask.bitfield.imm32s = 1;
5248 break;
5249 case LONG_MNEM_SUFFIX:
5250 mask.bitfield.imm32 = 1;
5251 break;
5252 case WORD_MNEM_SUFFIX:
5253 mask.bitfield.imm16 = 1;
5254 break;
5255 case BYTE_MNEM_SUFFIX:
5256 mask.bitfield.imm8 = 1;
5257 break;
5258 default:
5259 break;
5260 }
5261 allowed = operand_type_and (mask, allowed);
5262 if (!operand_type_all_zero (&allowed))
5263 i.types[op] = operand_type_and (i.types[op], mask);
5264 }
5265 break;
5266 }
5267 }
5268 }
5269
5270 /* Try to use the smallest displacement type too. */
5271 static void
5272 optimize_disp (void)
5273 {
5274 int op;
5275
5276 for (op = i.operands; --op >= 0;)
5277 if (operand_type_check (i.types[op], disp))
5278 {
5279 if (i.op[op].disps->X_op == O_constant)
5280 {
5281 offsetT op_disp = i.op[op].disps->X_add_number;
5282
5283 if (i.types[op].bitfield.disp16
5284 && (op_disp & ~(offsetT) 0xffff) == 0)
5285 {
5286 /* If this operand is at most 16 bits, convert
5287 to a signed 16 bit number and don't use 64bit
5288 displacement. */
5289 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5290 i.types[op].bitfield.disp64 = 0;
5291 }
5292 #ifdef BFD64
5293 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5294 if (i.types[op].bitfield.disp32
5295 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5296 {
5297 /* If this operand is at most 32 bits, convert
5298 to a signed 32 bit number and don't use 64bit
5299 displacement. */
5300 op_disp &= (((offsetT) 2 << 31) - 1);
5301 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5302 i.types[op].bitfield.disp64 = 0;
5303 }
5304 #endif
5305 if (!op_disp && i.types[op].bitfield.baseindex)
5306 {
5307 i.types[op].bitfield.disp8 = 0;
5308 i.types[op].bitfield.disp16 = 0;
5309 i.types[op].bitfield.disp32 = 0;
5310 i.types[op].bitfield.disp32s = 0;
5311 i.types[op].bitfield.disp64 = 0;
5312 i.op[op].disps = 0;
5313 i.disp_operands--;
5314 }
5315 else if (flag_code == CODE_64BIT)
5316 {
5317 if (fits_in_signed_long (op_disp))
5318 {
5319 i.types[op].bitfield.disp64 = 0;
5320 i.types[op].bitfield.disp32s = 1;
5321 }
5322 if (i.prefix[ADDR_PREFIX]
5323 && fits_in_unsigned_long (op_disp))
5324 i.types[op].bitfield.disp32 = 1;
5325 }
5326 if ((i.types[op].bitfield.disp32
5327 || i.types[op].bitfield.disp32s
5328 || i.types[op].bitfield.disp16)
5329 && fits_in_disp8 (op_disp))
5330 i.types[op].bitfield.disp8 = 1;
5331 }
5332 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5333 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5334 {
5335 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5336 i.op[op].disps, 0, i.reloc[op]);
5337 i.types[op].bitfield.disp8 = 0;
5338 i.types[op].bitfield.disp16 = 0;
5339 i.types[op].bitfield.disp32 = 0;
5340 i.types[op].bitfield.disp32s = 0;
5341 i.types[op].bitfield.disp64 = 0;
5342 }
5343 else
5344 /* We only support 64bit displacement on constants. */
5345 i.types[op].bitfield.disp64 = 0;
5346 }
5347 }
5348
5349 /* Return 1 if there is a match in broadcast bytes between operand
5350 GIVEN and instruction template T. */
5351
5352 static INLINE int
5353 match_broadcast_size (const insn_template *t, unsigned int given)
5354 {
5355 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5356 && i.types[given].bitfield.byte)
5357 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5358 && i.types[given].bitfield.word)
5359 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5360 && i.types[given].bitfield.dword)
5361 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5362 && i.types[given].bitfield.qword));
5363 }
5364
5365 /* Check if operands are valid for the instruction. */
5366
5367 static int
5368 check_VecOperands (const insn_template *t)
5369 {
5370 unsigned int op;
5371 i386_cpu_flags cpu;
5372
5373 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5374 any one operand are implicity requiring AVX512VL support if the actual
5375 operand size is YMMword or XMMword. Since this function runs after
5376 template matching, there's no need to check for YMMword/XMMword in
5377 the template. */
5378 cpu = cpu_flags_and (t->cpu_flags, avx512);
5379 if (!cpu_flags_all_zero (&cpu)
5380 && !t->cpu_flags.bitfield.cpuavx512vl
5381 && !cpu_arch_flags.bitfield.cpuavx512vl)
5382 {
5383 for (op = 0; op < t->operands; ++op)
5384 {
5385 if (t->operand_types[op].bitfield.zmmword
5386 && (i.types[op].bitfield.ymmword
5387 || i.types[op].bitfield.xmmword))
5388 {
5389 i.error = unsupported;
5390 return 1;
5391 }
5392 }
5393 }
5394
5395 /* Without VSIB byte, we can't have a vector register for index. */
5396 if (!t->opcode_modifier.vecsib
5397 && i.index_reg
5398 && (i.index_reg->reg_type.bitfield.xmmword
5399 || i.index_reg->reg_type.bitfield.ymmword
5400 || i.index_reg->reg_type.bitfield.zmmword))
5401 {
5402 i.error = unsupported_vector_index_register;
5403 return 1;
5404 }
5405
5406 /* Check if default mask is allowed. */
5407 if (t->opcode_modifier.nodefmask
5408 && (!i.mask || i.mask->mask->reg_num == 0))
5409 {
5410 i.error = no_default_mask;
5411 return 1;
5412 }
5413
5414 /* For VSIB byte, we need a vector register for index, and all vector
5415 registers must be distinct. */
5416 if (t->opcode_modifier.vecsib)
5417 {
5418 if (!i.index_reg
5419 || !((t->opcode_modifier.vecsib == VecSIB128
5420 && i.index_reg->reg_type.bitfield.xmmword)
5421 || (t->opcode_modifier.vecsib == VecSIB256
5422 && i.index_reg->reg_type.bitfield.ymmword)
5423 || (t->opcode_modifier.vecsib == VecSIB512
5424 && i.index_reg->reg_type.bitfield.zmmword)))
5425 {
5426 i.error = invalid_vsib_address;
5427 return 1;
5428 }
5429
5430 gas_assert (i.reg_operands == 2 || i.mask);
5431 if (i.reg_operands == 2 && !i.mask)
5432 {
5433 gas_assert (i.types[0].bitfield.class == RegSIMD);
5434 gas_assert (i.types[0].bitfield.xmmword
5435 || i.types[0].bitfield.ymmword);
5436 gas_assert (i.types[2].bitfield.class == RegSIMD);
5437 gas_assert (i.types[2].bitfield.xmmword
5438 || i.types[2].bitfield.ymmword);
5439 if (operand_check == check_none)
5440 return 0;
5441 if (register_number (i.op[0].regs)
5442 != register_number (i.index_reg)
5443 && register_number (i.op[2].regs)
5444 != register_number (i.index_reg)
5445 && register_number (i.op[0].regs)
5446 != register_number (i.op[2].regs))
5447 return 0;
5448 if (operand_check == check_error)
5449 {
5450 i.error = invalid_vector_register_set;
5451 return 1;
5452 }
5453 as_warn (_("mask, index, and destination registers should be distinct"));
5454 }
5455 else if (i.reg_operands == 1 && i.mask)
5456 {
5457 if (i.types[1].bitfield.class == RegSIMD
5458 && (i.types[1].bitfield.xmmword
5459 || i.types[1].bitfield.ymmword
5460 || i.types[1].bitfield.zmmword)
5461 && (register_number (i.op[1].regs)
5462 == register_number (i.index_reg)))
5463 {
5464 if (operand_check == check_error)
5465 {
5466 i.error = invalid_vector_register_set;
5467 return 1;
5468 }
5469 if (operand_check != check_none)
5470 as_warn (_("index and destination registers should be distinct"));
5471 }
5472 }
5473 }
5474
5475 /* Check if broadcast is supported by the instruction and is applied
5476 to the memory operand. */
5477 if (i.broadcast)
5478 {
5479 i386_operand_type type, overlap;
5480
5481 /* Check if specified broadcast is supported in this instruction,
5482 and its broadcast bytes match the memory operand. */
5483 op = i.broadcast->operand;
5484 if (!t->opcode_modifier.broadcast
5485 || !(i.flags[op] & Operand_Mem)
5486 || (!i.types[op].bitfield.unspecified
5487 && !match_broadcast_size (t, op)))
5488 {
5489 bad_broadcast:
5490 i.error = unsupported_broadcast;
5491 return 1;
5492 }
5493
5494 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5495 * i.broadcast->type);
5496 operand_type_set (&type, 0);
5497 switch (i.broadcast->bytes)
5498 {
5499 case 2:
5500 type.bitfield.word = 1;
5501 break;
5502 case 4:
5503 type.bitfield.dword = 1;
5504 break;
5505 case 8:
5506 type.bitfield.qword = 1;
5507 break;
5508 case 16:
5509 type.bitfield.xmmword = 1;
5510 break;
5511 case 32:
5512 type.bitfield.ymmword = 1;
5513 break;
5514 case 64:
5515 type.bitfield.zmmword = 1;
5516 break;
5517 default:
5518 goto bad_broadcast;
5519 }
5520
5521 overlap = operand_type_and (type, t->operand_types[op]);
5522 if (operand_type_all_zero (&overlap))
5523 goto bad_broadcast;
5524
5525 if (t->opcode_modifier.checkregsize)
5526 {
5527 unsigned int j;
5528
5529 type.bitfield.baseindex = 1;
5530 for (j = 0; j < i.operands; ++j)
5531 {
5532 if (j != op
5533 && !operand_type_register_match(i.types[j],
5534 t->operand_types[j],
5535 type,
5536 t->operand_types[op]))
5537 goto bad_broadcast;
5538 }
5539 }
5540 }
5541 /* If broadcast is supported in this instruction, we need to check if
5542 operand of one-element size isn't specified without broadcast. */
5543 else if (t->opcode_modifier.broadcast && i.mem_operands)
5544 {
5545 /* Find memory operand. */
5546 for (op = 0; op < i.operands; op++)
5547 if (i.flags[op] & Operand_Mem)
5548 break;
5549 gas_assert (op < i.operands);
5550 /* Check size of the memory operand. */
5551 if (match_broadcast_size (t, op))
5552 {
5553 i.error = broadcast_needed;
5554 return 1;
5555 }
5556 }
5557 else
5558 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5559
5560 /* Check if requested masking is supported. */
5561 if (i.mask)
5562 {
5563 switch (t->opcode_modifier.masking)
5564 {
5565 case BOTH_MASKING:
5566 break;
5567 case MERGING_MASKING:
5568 if (i.mask->zeroing)
5569 {
5570 case 0:
5571 i.error = unsupported_masking;
5572 return 1;
5573 }
5574 break;
5575 case DYNAMIC_MASKING:
5576 /* Memory destinations allow only merging masking. */
5577 if (i.mask->zeroing && i.mem_operands)
5578 {
5579 /* Find memory operand. */
5580 for (op = 0; op < i.operands; op++)
5581 if (i.flags[op] & Operand_Mem)
5582 break;
5583 gas_assert (op < i.operands);
5584 if (op == i.operands - 1)
5585 {
5586 i.error = unsupported_masking;
5587 return 1;
5588 }
5589 }
5590 break;
5591 default:
5592 abort ();
5593 }
5594 }
5595
5596 /* Check if masking is applied to dest operand. */
5597 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5598 {
5599 i.error = mask_not_on_destination;
5600 return 1;
5601 }
5602
5603 /* Check RC/SAE. */
5604 if (i.rounding)
5605 {
5606 if (!t->opcode_modifier.sae
5607 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5608 {
5609 i.error = unsupported_rc_sae;
5610 return 1;
5611 }
5612 /* If the instruction has several immediate operands and one of
5613 them is rounding, the rounding operand should be the last
5614 immediate operand. */
5615 if (i.imm_operands > 1
5616 && i.rounding->operand != (int) (i.imm_operands - 1))
5617 {
5618 i.error = rc_sae_operand_not_last_imm;
5619 return 1;
5620 }
5621 }
5622
5623 /* Check vector Disp8 operand. */
5624 if (t->opcode_modifier.disp8memshift
5625 && i.disp_encoding != disp_encoding_32bit)
5626 {
5627 if (i.broadcast)
5628 i.memshift = t->opcode_modifier.broadcast - 1;
5629 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5630 i.memshift = t->opcode_modifier.disp8memshift;
5631 else
5632 {
5633 const i386_operand_type *type = NULL;
5634
5635 i.memshift = 0;
5636 for (op = 0; op < i.operands; op++)
5637 if (i.flags[op] & Operand_Mem)
5638 {
5639 if (t->opcode_modifier.evex == EVEXLIG)
5640 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5641 else if (t->operand_types[op].bitfield.xmmword
5642 + t->operand_types[op].bitfield.ymmword
5643 + t->operand_types[op].bitfield.zmmword <= 1)
5644 type = &t->operand_types[op];
5645 else if (!i.types[op].bitfield.unspecified)
5646 type = &i.types[op];
5647 }
5648 else if (i.types[op].bitfield.class == RegSIMD
5649 && t->opcode_modifier.evex != EVEXLIG)
5650 {
5651 if (i.types[op].bitfield.zmmword)
5652 i.memshift = 6;
5653 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5654 i.memshift = 5;
5655 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5656 i.memshift = 4;
5657 }
5658
5659 if (type)
5660 {
5661 if (type->bitfield.zmmword)
5662 i.memshift = 6;
5663 else if (type->bitfield.ymmword)
5664 i.memshift = 5;
5665 else if (type->bitfield.xmmword)
5666 i.memshift = 4;
5667 }
5668
5669 /* For the check in fits_in_disp8(). */
5670 if (i.memshift == 0)
5671 i.memshift = -1;
5672 }
5673
5674 for (op = 0; op < i.operands; op++)
5675 if (operand_type_check (i.types[op], disp)
5676 && i.op[op].disps->X_op == O_constant)
5677 {
5678 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5679 {
5680 i.types[op].bitfield.disp8 = 1;
5681 return 0;
5682 }
5683 i.types[op].bitfield.disp8 = 0;
5684 }
5685 }
5686
5687 i.memshift = 0;
5688
5689 return 0;
5690 }
5691
5692 /* Check if operands are valid for the instruction. Update VEX
5693 operand types. */
5694
5695 static int
5696 VEX_check_operands (const insn_template *t)
5697 {
5698 if (i.vec_encoding == vex_encoding_evex)
5699 {
5700 /* This instruction must be encoded with EVEX prefix. */
5701 if (!is_evex_encoding (t))
5702 {
5703 i.error = unsupported;
5704 return 1;
5705 }
5706 return 0;
5707 }
5708
5709 if (!t->opcode_modifier.vex)
5710 {
5711 /* This instruction template doesn't have VEX prefix. */
5712 if (i.vec_encoding != vex_encoding_default)
5713 {
5714 i.error = unsupported;
5715 return 1;
5716 }
5717 return 0;
5718 }
5719
5720 /* Check the special Imm4 cases; must be the first operand. */
5721 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5722 {
5723 if (i.op[0].imms->X_op != O_constant
5724 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5725 {
5726 i.error = bad_imm4;
5727 return 1;
5728 }
5729
5730 /* Turn off Imm<N> so that update_imm won't complain. */
5731 operand_type_set (&i.types[0], 0);
5732 }
5733
5734 return 0;
5735 }
5736
5737 static const insn_template *
5738 match_template (char mnem_suffix)
5739 {
5740 /* Points to template once we've found it. */
5741 const insn_template *t;
5742 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5743 i386_operand_type overlap4;
5744 unsigned int found_reverse_match;
5745 i386_opcode_modifier suffix_check;
5746 i386_operand_type operand_types [MAX_OPERANDS];
5747 int addr_prefix_disp;
5748 unsigned int j, size_match, check_register;
5749 enum i386_error specific_error = 0;
5750
5751 #if MAX_OPERANDS != 5
5752 # error "MAX_OPERANDS must be 5."
5753 #endif
5754
5755 found_reverse_match = 0;
5756 addr_prefix_disp = -1;
5757
5758 /* Prepare for mnemonic suffix check. */
5759 memset (&suffix_check, 0, sizeof (suffix_check));
5760 switch (mnem_suffix)
5761 {
5762 case BYTE_MNEM_SUFFIX:
5763 suffix_check.no_bsuf = 1;
5764 break;
5765 case WORD_MNEM_SUFFIX:
5766 suffix_check.no_wsuf = 1;
5767 break;
5768 case SHORT_MNEM_SUFFIX:
5769 suffix_check.no_ssuf = 1;
5770 break;
5771 case LONG_MNEM_SUFFIX:
5772 suffix_check.no_lsuf = 1;
5773 break;
5774 case QWORD_MNEM_SUFFIX:
5775 suffix_check.no_qsuf = 1;
5776 break;
5777 default:
5778 /* NB: In Intel syntax, normally we can check for memory operand
5779 size when there is no mnemonic suffix. But jmp and call have
5780 2 different encodings with Dword memory operand size, one with
5781 No_ldSuf and the other without. i.suffix is set to
5782 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
5783 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5784 suffix_check.no_ldsuf = 1;
5785 }
5786
5787 /* Must have right number of operands. */
5788 i.error = number_of_operands_mismatch;
5789
5790 for (t = current_templates->start; t < current_templates->end; t++)
5791 {
5792 addr_prefix_disp = -1;
5793 found_reverse_match = 0;
5794
5795 if (i.operands != t->operands)
5796 continue;
5797
5798 /* Check processor support. */
5799 i.error = unsupported;
5800 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
5801 continue;
5802
5803 /* Check AT&T mnemonic. */
5804 i.error = unsupported_with_intel_mnemonic;
5805 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5806 continue;
5807
5808 /* Check AT&T/Intel syntax. */
5809 i.error = unsupported_syntax;
5810 if ((intel_syntax && t->opcode_modifier.attsyntax)
5811 || (!intel_syntax && t->opcode_modifier.intelsyntax))
5812 continue;
5813
5814 /* Check Intel64/AMD64 ISA. */
5815 switch (isa64)
5816 {
5817 default:
5818 /* Default: Don't accept Intel64. */
5819 if (t->opcode_modifier.isa64 == INTEL64)
5820 continue;
5821 break;
5822 case amd64:
5823 /* -mamd64: Don't accept Intel64 and Intel64 only. */
5824 if (t->opcode_modifier.isa64 >= INTEL64)
5825 continue;
5826 break;
5827 case intel64:
5828 /* -mintel64: Don't accept AMD64. */
5829 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
5830 continue;
5831 break;
5832 }
5833
5834 /* Check the suffix. */
5835 i.error = invalid_instruction_suffix;
5836 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5837 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5838 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5839 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5840 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5841 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5842 continue;
5843
5844 size_match = operand_size_match (t);
5845 if (!size_match)
5846 continue;
5847
5848 /* This is intentionally not
5849
5850 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
5851
5852 as the case of a missing * on the operand is accepted (perhaps with
5853 a warning, issued further down). */
5854 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
5855 {
5856 i.error = operand_type_mismatch;
5857 continue;
5858 }
5859
5860 for (j = 0; j < MAX_OPERANDS; j++)
5861 operand_types[j] = t->operand_types[j];
5862
5863 /* In general, don't allow 64-bit operands in 32-bit mode. */
5864 if (i.suffix == QWORD_MNEM_SUFFIX
5865 && flag_code != CODE_64BIT
5866 && (intel_syntax
5867 ? (!t->opcode_modifier.ignoresize
5868 && !t->opcode_modifier.broadcast
5869 && !intel_float_operand (t->name))
5870 : intel_float_operand (t->name) != 2)
5871 && ((operand_types[0].bitfield.class != RegMMX
5872 && operand_types[0].bitfield.class != RegSIMD)
5873 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5874 && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5875 && (t->base_opcode != 0x0fc7
5876 || t->extension_opcode != 1 /* cmpxchg8b */))
5877 continue;
5878
5879 /* In general, don't allow 32-bit operands on pre-386. */
5880 else if (i.suffix == LONG_MNEM_SUFFIX
5881 && !cpu_arch_flags.bitfield.cpui386
5882 && (intel_syntax
5883 ? (!t->opcode_modifier.ignoresize
5884 && !intel_float_operand (t->name))
5885 : intel_float_operand (t->name) != 2)
5886 && ((operand_types[0].bitfield.class != RegMMX
5887 && operand_types[0].bitfield.class != RegSIMD)
5888 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5889 && operand_types[t->operands > 1].bitfield.class
5890 != RegSIMD)))
5891 continue;
5892
5893 /* Do not verify operands when there are none. */
5894 else
5895 {
5896 if (!t->operands)
5897 /* We've found a match; break out of loop. */
5898 break;
5899 }
5900
5901 if (!t->opcode_modifier.jump
5902 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
5903 {
5904 /* There should be only one Disp operand. */
5905 for (j = 0; j < MAX_OPERANDS; j++)
5906 if (operand_type_check (operand_types[j], disp))
5907 break;
5908 if (j < MAX_OPERANDS)
5909 {
5910 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
5911
5912 addr_prefix_disp = j;
5913
5914 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
5915 operand into Disp32/Disp32/Disp16/Disp32 operand. */
5916 switch (flag_code)
5917 {
5918 case CODE_16BIT:
5919 override = !override;
5920 /* Fall through. */
5921 case CODE_32BIT:
5922 if (operand_types[j].bitfield.disp32
5923 && operand_types[j].bitfield.disp16)
5924 {
5925 operand_types[j].bitfield.disp16 = override;
5926 operand_types[j].bitfield.disp32 = !override;
5927 }
5928 operand_types[j].bitfield.disp32s = 0;
5929 operand_types[j].bitfield.disp64 = 0;
5930 break;
5931
5932 case CODE_64BIT:
5933 if (operand_types[j].bitfield.disp32s
5934 || operand_types[j].bitfield.disp64)
5935 {
5936 operand_types[j].bitfield.disp64 &= !override;
5937 operand_types[j].bitfield.disp32s &= !override;
5938 operand_types[j].bitfield.disp32 = override;
5939 }
5940 operand_types[j].bitfield.disp16 = 0;
5941 break;
5942 }
5943 }
5944 }
5945
5946 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5947 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5948 continue;
5949
5950 /* We check register size if needed. */
5951 if (t->opcode_modifier.checkregsize)
5952 {
5953 check_register = (1 << t->operands) - 1;
5954 if (i.broadcast)
5955 check_register &= ~(1 << i.broadcast->operand);
5956 }
5957 else
5958 check_register = 0;
5959
5960 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5961 switch (t->operands)
5962 {
5963 case 1:
5964 if (!operand_type_match (overlap0, i.types[0]))
5965 continue;
5966 break;
5967 case 2:
5968 /* xchg %eax, %eax is a special case. It is an alias for nop
5969 only in 32bit mode and we can use opcode 0x90. In 64bit
5970 mode, we can't use 0x90 for xchg %eax, %eax since it should
5971 zero-extend %eax to %rax. */
5972 if (flag_code == CODE_64BIT
5973 && t->base_opcode == 0x90
5974 && i.types[0].bitfield.instance == Accum
5975 && i.types[0].bitfield.dword
5976 && i.types[1].bitfield.instance == Accum
5977 && i.types[1].bitfield.dword)
5978 continue;
5979 /* xrelease mov %eax, <disp> is another special case. It must not
5980 match the accumulator-only encoding of mov. */
5981 if (flag_code != CODE_64BIT
5982 && i.hle_prefix
5983 && t->base_opcode == 0xa0
5984 && i.types[0].bitfield.instance == Accum
5985 && (i.flags[1] & Operand_Mem))
5986 continue;
5987 /* Fall through. */
5988
5989 case 3:
5990 if (!(size_match & MATCH_STRAIGHT))
5991 goto check_reverse;
5992 /* Reverse direction of operands if swapping is possible in the first
5993 place (operands need to be symmetric) and
5994 - the load form is requested, and the template is a store form,
5995 - the store form is requested, and the template is a load form,
5996 - the non-default (swapped) form is requested. */
5997 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5998 if (t->opcode_modifier.d && i.reg_operands == i.operands
5999 && !operand_type_all_zero (&overlap1))
6000 switch (i.dir_encoding)
6001 {
6002 case dir_encoding_load:
6003 if (operand_type_check (operand_types[i.operands - 1], anymem)
6004 || t->opcode_modifier.regmem)
6005 goto check_reverse;
6006 break;
6007
6008 case dir_encoding_store:
6009 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6010 && !t->opcode_modifier.regmem)
6011 goto check_reverse;
6012 break;
6013
6014 case dir_encoding_swap:
6015 goto check_reverse;
6016
6017 case dir_encoding_default:
6018 break;
6019 }
6020 /* If we want store form, we skip the current load. */
6021 if ((i.dir_encoding == dir_encoding_store
6022 || i.dir_encoding == dir_encoding_swap)
6023 && i.mem_operands == 0
6024 && t->opcode_modifier.load)
6025 continue;
6026 /* Fall through. */
6027 case 4:
6028 case 5:
6029 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6030 if (!operand_type_match (overlap0, i.types[0])
6031 || !operand_type_match (overlap1, i.types[1])
6032 || ((check_register & 3) == 3
6033 && !operand_type_register_match (i.types[0],
6034 operand_types[0],
6035 i.types[1],
6036 operand_types[1])))
6037 {
6038 /* Check if other direction is valid ... */
6039 if (!t->opcode_modifier.d)
6040 continue;
6041
6042 check_reverse:
6043 if (!(size_match & MATCH_REVERSE))
6044 continue;
6045 /* Try reversing direction of operands. */
6046 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6047 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6048 if (!operand_type_match (overlap0, i.types[0])
6049 || !operand_type_match (overlap1, i.types[i.operands - 1])
6050 || (check_register
6051 && !operand_type_register_match (i.types[0],
6052 operand_types[i.operands - 1],
6053 i.types[i.operands - 1],
6054 operand_types[0])))
6055 {
6056 /* Does not match either direction. */
6057 continue;
6058 }
6059 /* found_reverse_match holds which of D or FloatR
6060 we've found. */
6061 if (!t->opcode_modifier.d)
6062 found_reverse_match = 0;
6063 else if (operand_types[0].bitfield.tbyte)
6064 found_reverse_match = Opcode_FloatD;
6065 else if (operand_types[0].bitfield.xmmword
6066 || operand_types[i.operands - 1].bitfield.xmmword
6067 || operand_types[0].bitfield.class == RegMMX
6068 || operand_types[i.operands - 1].bitfield.class == RegMMX
6069 || is_any_vex_encoding(t))
6070 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6071 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6072 else
6073 found_reverse_match = Opcode_D;
6074 if (t->opcode_modifier.floatr)
6075 found_reverse_match |= Opcode_FloatR;
6076 }
6077 else
6078 {
6079 /* Found a forward 2 operand match here. */
6080 switch (t->operands)
6081 {
6082 case 5:
6083 overlap4 = operand_type_and (i.types[4],
6084 operand_types[4]);
6085 /* Fall through. */
6086 case 4:
6087 overlap3 = operand_type_and (i.types[3],
6088 operand_types[3]);
6089 /* Fall through. */
6090 case 3:
6091 overlap2 = operand_type_and (i.types[2],
6092 operand_types[2]);
6093 break;
6094 }
6095
6096 switch (t->operands)
6097 {
6098 case 5:
6099 if (!operand_type_match (overlap4, i.types[4])
6100 || !operand_type_register_match (i.types[3],
6101 operand_types[3],
6102 i.types[4],
6103 operand_types[4]))
6104 continue;
6105 /* Fall through. */
6106 case 4:
6107 if (!operand_type_match (overlap3, i.types[3])
6108 || ((check_register & 0xa) == 0xa
6109 && !operand_type_register_match (i.types[1],
6110 operand_types[1],
6111 i.types[3],
6112 operand_types[3]))
6113 || ((check_register & 0xc) == 0xc
6114 && !operand_type_register_match (i.types[2],
6115 operand_types[2],
6116 i.types[3],
6117 operand_types[3])))
6118 continue;
6119 /* Fall through. */
6120 case 3:
6121 /* Here we make use of the fact that there are no
6122 reverse match 3 operand instructions. */
6123 if (!operand_type_match (overlap2, i.types[2])
6124 || ((check_register & 5) == 5
6125 && !operand_type_register_match (i.types[0],
6126 operand_types[0],
6127 i.types[2],
6128 operand_types[2]))
6129 || ((check_register & 6) == 6
6130 && !operand_type_register_match (i.types[1],
6131 operand_types[1],
6132 i.types[2],
6133 operand_types[2])))
6134 continue;
6135 break;
6136 }
6137 }
6138 /* Found either forward/reverse 2, 3 or 4 operand match here:
6139 slip through to break. */
6140 }
6141
6142 /* Check if vector and VEX operands are valid. */
6143 if (check_VecOperands (t) || VEX_check_operands (t))
6144 {
6145 specific_error = i.error;
6146 continue;
6147 }
6148
6149 /* We've found a match; break out of loop. */
6150 break;
6151 }
6152
6153 if (t == current_templates->end)
6154 {
6155 /* We found no match. */
6156 const char *err_msg;
6157 switch (specific_error ? specific_error : i.error)
6158 {
6159 default:
6160 abort ();
6161 case operand_size_mismatch:
6162 err_msg = _("operand size mismatch");
6163 break;
6164 case operand_type_mismatch:
6165 err_msg = _("operand type mismatch");
6166 break;
6167 case register_type_mismatch:
6168 err_msg = _("register type mismatch");
6169 break;
6170 case number_of_operands_mismatch:
6171 err_msg = _("number of operands mismatch");
6172 break;
6173 case invalid_instruction_suffix:
6174 err_msg = _("invalid instruction suffix");
6175 break;
6176 case bad_imm4:
6177 err_msg = _("constant doesn't fit in 4 bits");
6178 break;
6179 case unsupported_with_intel_mnemonic:
6180 err_msg = _("unsupported with Intel mnemonic");
6181 break;
6182 case unsupported_syntax:
6183 err_msg = _("unsupported syntax");
6184 break;
6185 case unsupported:
6186 as_bad (_("unsupported instruction `%s'"),
6187 current_templates->start->name);
6188 return NULL;
6189 case invalid_vsib_address:
6190 err_msg = _("invalid VSIB address");
6191 break;
6192 case invalid_vector_register_set:
6193 err_msg = _("mask, index, and destination registers must be distinct");
6194 break;
6195 case unsupported_vector_index_register:
6196 err_msg = _("unsupported vector index register");
6197 break;
6198 case unsupported_broadcast:
6199 err_msg = _("unsupported broadcast");
6200 break;
6201 case broadcast_needed:
6202 err_msg = _("broadcast is needed for operand of such type");
6203 break;
6204 case unsupported_masking:
6205 err_msg = _("unsupported masking");
6206 break;
6207 case mask_not_on_destination:
6208 err_msg = _("mask not on destination operand");
6209 break;
6210 case no_default_mask:
6211 err_msg = _("default mask isn't allowed");
6212 break;
6213 case unsupported_rc_sae:
6214 err_msg = _("unsupported static rounding/sae");
6215 break;
6216 case rc_sae_operand_not_last_imm:
6217 if (intel_syntax)
6218 err_msg = _("RC/SAE operand must precede immediate operands");
6219 else
6220 err_msg = _("RC/SAE operand must follow immediate operands");
6221 break;
6222 case invalid_register_operand:
6223 err_msg = _("invalid register operand");
6224 break;
6225 }
6226 as_bad (_("%s for `%s'"), err_msg,
6227 current_templates->start->name);
6228 return NULL;
6229 }
6230
6231 if (!quiet_warnings)
6232 {
6233 if (!intel_syntax
6234 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6235 as_warn (_("indirect %s without `*'"), t->name);
6236
6237 if (t->opcode_modifier.isprefix
6238 && t->opcode_modifier.ignoresize)
6239 {
6240 /* Warn them that a data or address size prefix doesn't
6241 affect assembly of the next line of code. */
6242 as_warn (_("stand-alone `%s' prefix"), t->name);
6243 }
6244 }
6245
6246 /* Copy the template we found. */
6247 i.tm = *t;
6248
6249 if (addr_prefix_disp != -1)
6250 i.tm.operand_types[addr_prefix_disp]
6251 = operand_types[addr_prefix_disp];
6252
6253 if (found_reverse_match)
6254 {
6255 /* If we found a reverse match we must alter the opcode direction
6256 bit and clear/flip the regmem modifier one. found_reverse_match
6257 holds bits to change (different for int & float insns). */
6258
6259 i.tm.base_opcode ^= found_reverse_match;
6260
6261 i.tm.operand_types[0] = operand_types[i.operands - 1];
6262 i.tm.operand_types[i.operands - 1] = operand_types[0];
6263
6264 /* Certain SIMD insns have their load forms specified in the opcode
6265 table, and hence we need to _set_ RegMem instead of clearing it.
6266 We need to avoid setting the bit though on insns like KMOVW. */
6267 i.tm.opcode_modifier.regmem
6268 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6269 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6270 && !i.tm.opcode_modifier.regmem;
6271 }
6272
6273 return t;
6274 }
6275
6276 static int
6277 check_string (void)
6278 {
6279 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6280 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6281
6282 if (i.seg[op] != NULL && i.seg[op] != &es)
6283 {
6284 as_bad (_("`%s' operand %u must use `%ses' segment"),
6285 i.tm.name,
6286 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6287 register_prefix);
6288 return 0;
6289 }
6290
6291 /* There's only ever one segment override allowed per instruction.
6292 This instruction possibly has a legal segment override on the
6293 second operand, so copy the segment to where non-string
6294 instructions store it, allowing common code. */
6295 i.seg[op] = i.seg[1];
6296
6297 return 1;
6298 }
6299
6300 static int
6301 process_suffix (void)
6302 {
6303 /* If matched instruction specifies an explicit instruction mnemonic
6304 suffix, use it. */
6305 if (i.tm.opcode_modifier.size == SIZE16)
6306 i.suffix = WORD_MNEM_SUFFIX;
6307 else if (i.tm.opcode_modifier.size == SIZE32)
6308 i.suffix = LONG_MNEM_SUFFIX;
6309 else if (i.tm.opcode_modifier.size == SIZE64)
6310 i.suffix = QWORD_MNEM_SUFFIX;
6311 else if (i.reg_operands
6312 && (i.operands > 1 || i.types[0].bitfield.class == Reg))
6313 {
6314 /* If there's no instruction mnemonic suffix we try to invent one
6315 based on GPR operands. */
6316 if (!i.suffix)
6317 {
6318 /* We take i.suffix from the last register operand specified,
6319 Destination register type is more significant than source
6320 register type. crc32 in SSE4.2 prefers source register
6321 type. */
6322 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6323
6324 while (op--)
6325 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6326 || i.tm.operand_types[op].bitfield.instance == Accum)
6327 {
6328 if (i.types[op].bitfield.class != Reg)
6329 continue;
6330 if (i.types[op].bitfield.byte)
6331 i.suffix = BYTE_MNEM_SUFFIX;
6332 else if (i.types[op].bitfield.word)
6333 i.suffix = WORD_MNEM_SUFFIX;
6334 else if (i.types[op].bitfield.dword)
6335 i.suffix = LONG_MNEM_SUFFIX;
6336 else if (i.types[op].bitfield.qword)
6337 i.suffix = QWORD_MNEM_SUFFIX;
6338 else
6339 continue;
6340 break;
6341 }
6342 }
6343 else if (i.suffix == BYTE_MNEM_SUFFIX)
6344 {
6345 if (intel_syntax
6346 && i.tm.opcode_modifier.ignoresize
6347 && i.tm.opcode_modifier.no_bsuf)
6348 i.suffix = 0;
6349 else if (!check_byte_reg ())
6350 return 0;
6351 }
6352 else if (i.suffix == LONG_MNEM_SUFFIX)
6353 {
6354 if (intel_syntax
6355 && i.tm.opcode_modifier.ignoresize
6356 && i.tm.opcode_modifier.no_lsuf
6357 && !i.tm.opcode_modifier.todword
6358 && !i.tm.opcode_modifier.toqword)
6359 i.suffix = 0;
6360 else if (!check_long_reg ())
6361 return 0;
6362 }
6363 else if (i.suffix == QWORD_MNEM_SUFFIX)
6364 {
6365 if (intel_syntax
6366 && i.tm.opcode_modifier.ignoresize
6367 && i.tm.opcode_modifier.no_qsuf
6368 && !i.tm.opcode_modifier.todword
6369 && !i.tm.opcode_modifier.toqword)
6370 i.suffix = 0;
6371 else if (!check_qword_reg ())
6372 return 0;
6373 }
6374 else if (i.suffix == WORD_MNEM_SUFFIX)
6375 {
6376 if (intel_syntax
6377 && i.tm.opcode_modifier.ignoresize
6378 && i.tm.opcode_modifier.no_wsuf)
6379 i.suffix = 0;
6380 else if (!check_word_reg ())
6381 return 0;
6382 }
6383 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6384 /* Do nothing if the instruction is going to ignore the prefix. */
6385 ;
6386 else
6387 abort ();
6388 }
6389 else if (i.tm.opcode_modifier.defaultsize && !i.suffix)
6390 {
6391 i.suffix = stackop_size;
6392 if (stackop_size == LONG_MNEM_SUFFIX)
6393 {
6394 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6395 .code16gcc directive to support 16-bit mode with
6396 32-bit address. For IRET without a suffix, generate
6397 16-bit IRET (opcode 0xcf) to return from an interrupt
6398 handler. */
6399 if (i.tm.base_opcode == 0xcf)
6400 {
6401 i.suffix = WORD_MNEM_SUFFIX;
6402 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6403 }
6404 /* Warn about changed behavior for segment register push/pop. */
6405 else if ((i.tm.base_opcode | 1) == 0x07)
6406 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6407 i.tm.name);
6408 }
6409 }
6410 else if (!i.suffix
6411 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6412 || i.tm.opcode_modifier.jump == JUMP_BYTE
6413 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6414 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6415 && i.tm.extension_opcode <= 3)))
6416 {
6417 switch (flag_code)
6418 {
6419 case CODE_64BIT:
6420 if (!i.tm.opcode_modifier.no_qsuf)
6421 {
6422 i.suffix = QWORD_MNEM_SUFFIX;
6423 break;
6424 }
6425 /* Fall through. */
6426 case CODE_32BIT:
6427 if (!i.tm.opcode_modifier.no_lsuf)
6428 i.suffix = LONG_MNEM_SUFFIX;
6429 break;
6430 case CODE_16BIT:
6431 if (!i.tm.opcode_modifier.no_wsuf)
6432 i.suffix = WORD_MNEM_SUFFIX;
6433 break;
6434 }
6435 }
6436
6437 if (!i.suffix
6438 && (!i.tm.opcode_modifier.defaultsize
6439 /* Also cover lret/retf/iret in 64-bit mode. */
6440 || (flag_code == CODE_64BIT
6441 && !i.tm.opcode_modifier.no_lsuf
6442 && !i.tm.opcode_modifier.no_qsuf))
6443 && !i.tm.opcode_modifier.ignoresize
6444 /* Accept FLDENV et al without suffix. */
6445 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6446 {
6447 unsigned int suffixes, evex = 0;
6448
6449 suffixes = !i.tm.opcode_modifier.no_bsuf;
6450 if (!i.tm.opcode_modifier.no_wsuf)
6451 suffixes |= 1 << 1;
6452 if (!i.tm.opcode_modifier.no_lsuf)
6453 suffixes |= 1 << 2;
6454 if (!i.tm.opcode_modifier.no_ldsuf)
6455 suffixes |= 1 << 3;
6456 if (!i.tm.opcode_modifier.no_ssuf)
6457 suffixes |= 1 << 4;
6458 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6459 suffixes |= 1 << 5;
6460
6461 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6462 also suitable for AT&T syntax mode, it was requested that this be
6463 restricted to just Intel syntax. */
6464 if (intel_syntax)
6465 {
6466 i386_cpu_flags cpu = cpu_flags_and (i.tm.cpu_flags, avx512);
6467
6468 if (!cpu_flags_all_zero (&cpu) && !i.broadcast)
6469 {
6470 unsigned int op;
6471
6472 for (op = 0; op < i.tm.operands; ++op)
6473 {
6474 if (!cpu_arch_flags.bitfield.cpuavx512vl)
6475 {
6476 if (i.tm.operand_types[op].bitfield.ymmword)
6477 i.tm.operand_types[op].bitfield.xmmword = 0;
6478 if (i.tm.operand_types[op].bitfield.zmmword)
6479 i.tm.operand_types[op].bitfield.ymmword = 0;
6480 if (!i.tm.opcode_modifier.evex
6481 || i.tm.opcode_modifier.evex == EVEXDYN)
6482 i.tm.opcode_modifier.evex = EVEX512;
6483 }
6484
6485 if (i.tm.operand_types[op].bitfield.xmmword
6486 + i.tm.operand_types[op].bitfield.ymmword
6487 + i.tm.operand_types[op].bitfield.zmmword < 2)
6488 continue;
6489
6490 /* Any properly sized operand disambiguates the insn. */
6491 if (i.types[op].bitfield.xmmword
6492 || i.types[op].bitfield.ymmword
6493 || i.types[op].bitfield.zmmword)
6494 {
6495 suffixes &= ~(7 << 6);
6496 evex = 0;
6497 break;
6498 }
6499
6500 if ((i.flags[op] & Operand_Mem)
6501 && i.tm.operand_types[op].bitfield.unspecified)
6502 {
6503 if (i.tm.operand_types[op].bitfield.xmmword)
6504 suffixes |= 1 << 6;
6505 if (i.tm.operand_types[op].bitfield.ymmword)
6506 suffixes |= 1 << 7;
6507 if (i.tm.operand_types[op].bitfield.zmmword)
6508 suffixes |= 1 << 8;
6509 evex = EVEX512;
6510 }
6511 }
6512 }
6513 }
6514
6515 /* Are multiple suffixes / operand sizes allowed? */
6516 if (suffixes & (suffixes - 1))
6517 {
6518 if (intel_syntax
6519 && (!i.tm.opcode_modifier.defaultsize
6520 || operand_check == check_error))
6521 {
6522 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6523 return 0;
6524 }
6525 if (operand_check == check_error)
6526 {
6527 as_bad (_("no instruction mnemonic suffix given and "
6528 "no register operands; can't size `%s'"), i.tm.name);
6529 return 0;
6530 }
6531 if (operand_check == check_warning)
6532 as_warn (_("%s; using default for `%s'"),
6533 intel_syntax
6534 ? _("ambiguous operand size")
6535 : _("no instruction mnemonic suffix given and "
6536 "no register operands"),
6537 i.tm.name);
6538
6539 if (i.tm.opcode_modifier.floatmf)
6540 i.suffix = SHORT_MNEM_SUFFIX;
6541 else if (evex)
6542 i.tm.opcode_modifier.evex = evex;
6543 else if (flag_code == CODE_16BIT)
6544 i.suffix = WORD_MNEM_SUFFIX;
6545 else if (!i.tm.opcode_modifier.no_lsuf)
6546 i.suffix = LONG_MNEM_SUFFIX;
6547 else
6548 i.suffix = QWORD_MNEM_SUFFIX;
6549 }
6550 }
6551
6552 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
6553 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
6554 != (i.tm.operand_types[1].bitfield.class == Reg);
6555
6556 /* Change the opcode based on the operand size given by i.suffix. */
6557 switch (i.suffix)
6558 {
6559 /* Size floating point instruction. */
6560 case LONG_MNEM_SUFFIX:
6561 if (i.tm.opcode_modifier.floatmf)
6562 {
6563 i.tm.base_opcode ^= 4;
6564 break;
6565 }
6566 /* fall through */
6567 case WORD_MNEM_SUFFIX:
6568 case QWORD_MNEM_SUFFIX:
6569 /* It's not a byte, select word/dword operation. */
6570 if (i.tm.opcode_modifier.w)
6571 {
6572 if (i.short_form)
6573 i.tm.base_opcode |= 8;
6574 else
6575 i.tm.base_opcode |= 1;
6576 }
6577 /* fall through */
6578 case SHORT_MNEM_SUFFIX:
6579 /* Now select between word & dword operations via the operand
6580 size prefix, except for instructions that will ignore this
6581 prefix anyway. */
6582 if (i.reg_operands > 0
6583 && i.types[0].bitfield.class == Reg
6584 && i.tm.opcode_modifier.addrprefixopreg
6585 && (i.tm.operand_types[0].bitfield.instance == Accum
6586 || i.operands == 1))
6587 {
6588 /* The address size override prefix changes the size of the
6589 first operand. */
6590 if ((flag_code == CODE_32BIT
6591 && i.op[0].regs->reg_type.bitfield.word)
6592 || (flag_code != CODE_32BIT
6593 && i.op[0].regs->reg_type.bitfield.dword))
6594 if (!add_prefix (ADDR_PREFIX_OPCODE))
6595 return 0;
6596 }
6597 else if (i.suffix != QWORD_MNEM_SUFFIX
6598 && !i.tm.opcode_modifier.ignoresize
6599 && !i.tm.opcode_modifier.floatmf
6600 && !is_any_vex_encoding (&i.tm)
6601 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6602 || (flag_code == CODE_64BIT
6603 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
6604 {
6605 unsigned int prefix = DATA_PREFIX_OPCODE;
6606
6607 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
6608 prefix = ADDR_PREFIX_OPCODE;
6609
6610 if (!add_prefix (prefix))
6611 return 0;
6612 }
6613
6614 /* Set mode64 for an operand. */
6615 if (i.suffix == QWORD_MNEM_SUFFIX
6616 && flag_code == CODE_64BIT
6617 && !i.tm.opcode_modifier.norex64
6618 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6619 need rex64. */
6620 && ! (i.operands == 2
6621 && i.tm.base_opcode == 0x90
6622 && i.tm.extension_opcode == None
6623 && i.types[0].bitfield.instance == Accum
6624 && i.types[0].bitfield.qword
6625 && i.types[1].bitfield.instance == Accum
6626 && i.types[1].bitfield.qword))
6627 i.rex |= REX_W;
6628
6629 break;
6630 }
6631
6632 if (i.reg_operands != 0
6633 && i.operands > 1
6634 && i.tm.opcode_modifier.addrprefixopreg
6635 && i.tm.operand_types[0].bitfield.instance != Accum)
6636 {
6637 /* Check invalid register operand when the address size override
6638 prefix changes the size of register operands. */
6639 unsigned int op;
6640 enum { need_word, need_dword, need_qword } need;
6641
6642 if (flag_code == CODE_32BIT)
6643 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6644 else
6645 {
6646 if (i.prefix[ADDR_PREFIX])
6647 need = need_dword;
6648 else
6649 need = flag_code == CODE_64BIT ? need_qword : need_word;
6650 }
6651
6652 for (op = 0; op < i.operands; op++)
6653 if (i.types[op].bitfield.class == Reg
6654 && ((need == need_word
6655 && !i.op[op].regs->reg_type.bitfield.word)
6656 || (need == need_dword
6657 && !i.op[op].regs->reg_type.bitfield.dword)
6658 || (need == need_qword
6659 && !i.op[op].regs->reg_type.bitfield.qword)))
6660 {
6661 as_bad (_("invalid register operand size for `%s'"),
6662 i.tm.name);
6663 return 0;
6664 }
6665 }
6666
6667 return 1;
6668 }
6669
6670 static int
6671 check_byte_reg (void)
6672 {
6673 int op;
6674
6675 for (op = i.operands; --op >= 0;)
6676 {
6677 /* Skip non-register operands. */
6678 if (i.types[op].bitfield.class != Reg)
6679 continue;
6680
6681 /* If this is an eight bit register, it's OK. If it's the 16 or
6682 32 bit version of an eight bit register, we will just use the
6683 low portion, and that's OK too. */
6684 if (i.types[op].bitfield.byte)
6685 continue;
6686
6687 /* I/O port address operands are OK too. */
6688 if (i.tm.operand_types[op].bitfield.instance == RegD
6689 && i.tm.operand_types[op].bitfield.word)
6690 continue;
6691
6692 /* crc32 only wants its source operand checked here. */
6693 if (i.tm.base_opcode == 0xf20f38f0 && op)
6694 continue;
6695
6696 /* Any other register is bad. */
6697 if (i.types[op].bitfield.class == Reg
6698 || i.types[op].bitfield.class == RegMMX
6699 || i.types[op].bitfield.class == RegSIMD
6700 || i.types[op].bitfield.class == SReg
6701 || i.types[op].bitfield.class == RegCR
6702 || i.types[op].bitfield.class == RegDR
6703 || i.types[op].bitfield.class == RegTR)
6704 {
6705 as_bad (_("`%s%s' not allowed with `%s%c'"),
6706 register_prefix,
6707 i.op[op].regs->reg_name,
6708 i.tm.name,
6709 i.suffix);
6710 return 0;
6711 }
6712 }
6713 return 1;
6714 }
6715
6716 static int
6717 check_long_reg (void)
6718 {
6719 int op;
6720
6721 for (op = i.operands; --op >= 0;)
6722 /* Skip non-register operands. */
6723 if (i.types[op].bitfield.class != Reg)
6724 continue;
6725 /* Reject eight bit registers, except where the template requires
6726 them. (eg. movzb) */
6727 else if (i.types[op].bitfield.byte
6728 && (i.tm.operand_types[op].bitfield.class == Reg
6729 || i.tm.operand_types[op].bitfield.instance == Accum)
6730 && (i.tm.operand_types[op].bitfield.word
6731 || i.tm.operand_types[op].bitfield.dword))
6732 {
6733 as_bad (_("`%s%s' not allowed with `%s%c'"),
6734 register_prefix,
6735 i.op[op].regs->reg_name,
6736 i.tm.name,
6737 i.suffix);
6738 return 0;
6739 }
6740 /* Error if the e prefix on a general reg is missing. */
6741 else if (i.types[op].bitfield.word
6742 && (i.tm.operand_types[op].bitfield.class == Reg
6743 || i.tm.operand_types[op].bitfield.instance == Accum)
6744 && i.tm.operand_types[op].bitfield.dword)
6745 {
6746 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6747 register_prefix, i.op[op].regs->reg_name,
6748 i.suffix);
6749 return 0;
6750 }
6751 /* Warn if the r prefix on a general reg is present. */
6752 else if (i.types[op].bitfield.qword
6753 && (i.tm.operand_types[op].bitfield.class == Reg
6754 || i.tm.operand_types[op].bitfield.instance == Accum)
6755 && i.tm.operand_types[op].bitfield.dword)
6756 {
6757 if (intel_syntax
6758 && (i.tm.opcode_modifier.toqword
6759 /* Also convert to QWORD for MOVSXD. */
6760 || i.tm.base_opcode == 0x63)
6761 && i.types[0].bitfield.class != RegSIMD)
6762 {
6763 /* Convert to QWORD. We want REX byte. */
6764 i.suffix = QWORD_MNEM_SUFFIX;
6765 }
6766 else
6767 {
6768 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6769 register_prefix, i.op[op].regs->reg_name,
6770 i.suffix);
6771 return 0;
6772 }
6773 }
6774 return 1;
6775 }
6776
6777 static int
6778 check_qword_reg (void)
6779 {
6780 int op;
6781
6782 for (op = i.operands; --op >= 0; )
6783 /* Skip non-register operands. */
6784 if (i.types[op].bitfield.class != Reg)
6785 continue;
6786 /* Reject eight bit registers, except where the template requires
6787 them. (eg. movzb) */
6788 else if (i.types[op].bitfield.byte
6789 && (i.tm.operand_types[op].bitfield.class == Reg
6790 || i.tm.operand_types[op].bitfield.instance == Accum)
6791 && (i.tm.operand_types[op].bitfield.word
6792 || i.tm.operand_types[op].bitfield.dword))
6793 {
6794 as_bad (_("`%s%s' not allowed with `%s%c'"),
6795 register_prefix,
6796 i.op[op].regs->reg_name,
6797 i.tm.name,
6798 i.suffix);
6799 return 0;
6800 }
6801 /* Warn if the r prefix on a general reg is missing. */
6802 else if ((i.types[op].bitfield.word
6803 || i.types[op].bitfield.dword)
6804 && (i.tm.operand_types[op].bitfield.class == Reg
6805 || i.tm.operand_types[op].bitfield.instance == Accum)
6806 && i.tm.operand_types[op].bitfield.qword)
6807 {
6808 /* Prohibit these changes in the 64bit mode, since the
6809 lowering is more complicated. */
6810 if (intel_syntax
6811 && i.tm.opcode_modifier.todword
6812 && i.types[0].bitfield.class != RegSIMD)
6813 {
6814 /* Convert to DWORD. We don't want REX byte. */
6815 i.suffix = LONG_MNEM_SUFFIX;
6816 }
6817 else
6818 {
6819 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6820 register_prefix, i.op[op].regs->reg_name,
6821 i.suffix);
6822 return 0;
6823 }
6824 }
6825 return 1;
6826 }
6827
6828 static int
6829 check_word_reg (void)
6830 {
6831 int op;
6832 for (op = i.operands; --op >= 0;)
6833 /* Skip non-register operands. */
6834 if (i.types[op].bitfield.class != Reg)
6835 continue;
6836 /* Reject eight bit registers, except where the template requires
6837 them. (eg. movzb) */
6838 else if (i.types[op].bitfield.byte
6839 && (i.tm.operand_types[op].bitfield.class == Reg
6840 || i.tm.operand_types[op].bitfield.instance == Accum)
6841 && (i.tm.operand_types[op].bitfield.word
6842 || i.tm.operand_types[op].bitfield.dword))
6843 {
6844 as_bad (_("`%s%s' not allowed with `%s%c'"),
6845 register_prefix,
6846 i.op[op].regs->reg_name,
6847 i.tm.name,
6848 i.suffix);
6849 return 0;
6850 }
6851 /* Error if the e or r prefix on a general reg is present. */
6852 else if ((i.types[op].bitfield.dword
6853 || i.types[op].bitfield.qword)
6854 && (i.tm.operand_types[op].bitfield.class == Reg
6855 || i.tm.operand_types[op].bitfield.instance == Accum)
6856 && i.tm.operand_types[op].bitfield.word)
6857 {
6858 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6859 register_prefix, i.op[op].regs->reg_name,
6860 i.suffix);
6861 return 0;
6862 }
6863 return 1;
6864 }
6865
6866 static int
6867 update_imm (unsigned int j)
6868 {
6869 i386_operand_type overlap = i.types[j];
6870 if ((overlap.bitfield.imm8
6871 || overlap.bitfield.imm8s
6872 || overlap.bitfield.imm16
6873 || overlap.bitfield.imm32
6874 || overlap.bitfield.imm32s
6875 || overlap.bitfield.imm64)
6876 && !operand_type_equal (&overlap, &imm8)
6877 && !operand_type_equal (&overlap, &imm8s)
6878 && !operand_type_equal (&overlap, &imm16)
6879 && !operand_type_equal (&overlap, &imm32)
6880 && !operand_type_equal (&overlap, &imm32s)
6881 && !operand_type_equal (&overlap, &imm64))
6882 {
6883 if (i.suffix)
6884 {
6885 i386_operand_type temp;
6886
6887 operand_type_set (&temp, 0);
6888 if (i.suffix == BYTE_MNEM_SUFFIX)
6889 {
6890 temp.bitfield.imm8 = overlap.bitfield.imm8;
6891 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6892 }
6893 else if (i.suffix == WORD_MNEM_SUFFIX)
6894 temp.bitfield.imm16 = overlap.bitfield.imm16;
6895 else if (i.suffix == QWORD_MNEM_SUFFIX)
6896 {
6897 temp.bitfield.imm64 = overlap.bitfield.imm64;
6898 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6899 }
6900 else
6901 temp.bitfield.imm32 = overlap.bitfield.imm32;
6902 overlap = temp;
6903 }
6904 else if (operand_type_equal (&overlap, &imm16_32_32s)
6905 || operand_type_equal (&overlap, &imm16_32)
6906 || operand_type_equal (&overlap, &imm16_32s))
6907 {
6908 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6909 overlap = imm16;
6910 else
6911 overlap = imm32s;
6912 }
6913 if (!operand_type_equal (&overlap, &imm8)
6914 && !operand_type_equal (&overlap, &imm8s)
6915 && !operand_type_equal (&overlap, &imm16)
6916 && !operand_type_equal (&overlap, &imm32)
6917 && !operand_type_equal (&overlap, &imm32s)
6918 && !operand_type_equal (&overlap, &imm64))
6919 {
6920 as_bad (_("no instruction mnemonic suffix given; "
6921 "can't determine immediate size"));
6922 return 0;
6923 }
6924 }
6925 i.types[j] = overlap;
6926
6927 return 1;
6928 }
6929
6930 static int
6931 finalize_imm (void)
6932 {
6933 unsigned int j, n;
6934
6935 /* Update the first 2 immediate operands. */
6936 n = i.operands > 2 ? 2 : i.operands;
6937 if (n)
6938 {
6939 for (j = 0; j < n; j++)
6940 if (update_imm (j) == 0)
6941 return 0;
6942
6943 /* The 3rd operand can't be immediate operand. */
6944 gas_assert (operand_type_check (i.types[2], imm) == 0);
6945 }
6946
6947 return 1;
6948 }
6949
6950 static int
6951 process_operands (void)
6952 {
6953 /* Default segment register this instruction will use for memory
6954 accesses. 0 means unknown. This is only for optimizing out
6955 unnecessary segment overrides. */
6956 const seg_entry *default_seg = 0;
6957
6958 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6959 {
6960 unsigned int dupl = i.operands;
6961 unsigned int dest = dupl - 1;
6962 unsigned int j;
6963
6964 /* The destination must be an xmm register. */
6965 gas_assert (i.reg_operands
6966 && MAX_OPERANDS > dupl
6967 && operand_type_equal (&i.types[dest], &regxmm));
6968
6969 if (i.tm.operand_types[0].bitfield.instance == Accum
6970 && i.tm.operand_types[0].bitfield.xmmword)
6971 {
6972 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6973 {
6974 /* Keep xmm0 for instructions with VEX prefix and 3
6975 sources. */
6976 i.tm.operand_types[0].bitfield.instance = InstanceNone;
6977 i.tm.operand_types[0].bitfield.class = RegSIMD;
6978 goto duplicate;
6979 }
6980 else
6981 {
6982 /* We remove the first xmm0 and keep the number of
6983 operands unchanged, which in fact duplicates the
6984 destination. */
6985 for (j = 1; j < i.operands; j++)
6986 {
6987 i.op[j - 1] = i.op[j];
6988 i.types[j - 1] = i.types[j];
6989 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6990 i.flags[j - 1] = i.flags[j];
6991 }
6992 }
6993 }
6994 else if (i.tm.opcode_modifier.implicit1stxmm0)
6995 {
6996 gas_assert ((MAX_OPERANDS - 1) > dupl
6997 && (i.tm.opcode_modifier.vexsources
6998 == VEX3SOURCES));
6999
7000 /* Add the implicit xmm0 for instructions with VEX prefix
7001 and 3 sources. */
7002 for (j = i.operands; j > 0; j--)
7003 {
7004 i.op[j] = i.op[j - 1];
7005 i.types[j] = i.types[j - 1];
7006 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7007 i.flags[j] = i.flags[j - 1];
7008 }
7009 i.op[0].regs
7010 = (const reg_entry *) hash_find (reg_hash, "xmm0");
7011 i.types[0] = regxmm;
7012 i.tm.operand_types[0] = regxmm;
7013
7014 i.operands += 2;
7015 i.reg_operands += 2;
7016 i.tm.operands += 2;
7017
7018 dupl++;
7019 dest++;
7020 i.op[dupl] = i.op[dest];
7021 i.types[dupl] = i.types[dest];
7022 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7023 i.flags[dupl] = i.flags[dest];
7024 }
7025 else
7026 {
7027 duplicate:
7028 i.operands++;
7029 i.reg_operands++;
7030 i.tm.operands++;
7031
7032 i.op[dupl] = i.op[dest];
7033 i.types[dupl] = i.types[dest];
7034 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7035 i.flags[dupl] = i.flags[dest];
7036 }
7037
7038 if (i.tm.opcode_modifier.immext)
7039 process_immext ();
7040 }
7041 else if (i.tm.operand_types[0].bitfield.instance == Accum
7042 && i.tm.operand_types[0].bitfield.xmmword)
7043 {
7044 unsigned int j;
7045
7046 for (j = 1; j < i.operands; j++)
7047 {
7048 i.op[j - 1] = i.op[j];
7049 i.types[j - 1] = i.types[j];
7050
7051 /* We need to adjust fields in i.tm since they are used by
7052 build_modrm_byte. */
7053 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7054
7055 i.flags[j - 1] = i.flags[j];
7056 }
7057
7058 i.operands--;
7059 i.reg_operands--;
7060 i.tm.operands--;
7061 }
7062 else if (i.tm.opcode_modifier.implicitquadgroup)
7063 {
7064 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7065
7066 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7067 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7068 regnum = register_number (i.op[1].regs);
7069 first_reg_in_group = regnum & ~3;
7070 last_reg_in_group = first_reg_in_group + 3;
7071 if (regnum != first_reg_in_group)
7072 as_warn (_("source register `%s%s' implicitly denotes"
7073 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7074 register_prefix, i.op[1].regs->reg_name,
7075 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7076 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7077 i.tm.name);
7078 }
7079 else if (i.tm.opcode_modifier.regkludge)
7080 {
7081 /* The imul $imm, %reg instruction is converted into
7082 imul $imm, %reg, %reg, and the clr %reg instruction
7083 is converted into xor %reg, %reg. */
7084
7085 unsigned int first_reg_op;
7086
7087 if (operand_type_check (i.types[0], reg))
7088 first_reg_op = 0;
7089 else
7090 first_reg_op = 1;
7091 /* Pretend we saw the extra register operand. */
7092 gas_assert (i.reg_operands == 1
7093 && i.op[first_reg_op + 1].regs == 0);
7094 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7095 i.types[first_reg_op + 1] = i.types[first_reg_op];
7096 i.operands++;
7097 i.reg_operands++;
7098 }
7099
7100 if (i.tm.opcode_modifier.modrm)
7101 {
7102 /* The opcode is completed (modulo i.tm.extension_opcode which
7103 must be put into the modrm byte). Now, we make the modrm and
7104 index base bytes based on all the info we've collected. */
7105
7106 default_seg = build_modrm_byte ();
7107 }
7108 else if (i.types[0].bitfield.class == SReg)
7109 {
7110 if (flag_code != CODE_64BIT
7111 ? i.tm.base_opcode == POP_SEG_SHORT
7112 && i.op[0].regs->reg_num == 1
7113 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7114 && i.op[0].regs->reg_num < 4)
7115 {
7116 as_bad (_("you can't `%s %s%s'"),
7117 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7118 return 0;
7119 }
7120 if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7121 {
7122 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7123 i.tm.opcode_length = 2;
7124 }
7125 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7126 }
7127 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7128 {
7129 default_seg = &ds;
7130 }
7131 else if (i.tm.opcode_modifier.isstring)
7132 {
7133 /* For the string instructions that allow a segment override
7134 on one of their operands, the default segment is ds. */
7135 default_seg = &ds;
7136 }
7137 else if (i.short_form)
7138 {
7139 /* The register or float register operand is in operand
7140 0 or 1. */
7141 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7142
7143 /* Register goes in low 3 bits of opcode. */
7144 i.tm.base_opcode |= i.op[op].regs->reg_num;
7145 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7146 i.rex |= REX_B;
7147 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7148 {
7149 /* Warn about some common errors, but press on regardless.
7150 The first case can be generated by gcc (<= 2.8.1). */
7151 if (i.operands == 2)
7152 {
7153 /* Reversed arguments on faddp, fsubp, etc. */
7154 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7155 register_prefix, i.op[!intel_syntax].regs->reg_name,
7156 register_prefix, i.op[intel_syntax].regs->reg_name);
7157 }
7158 else
7159 {
7160 /* Extraneous `l' suffix on fp insn. */
7161 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7162 register_prefix, i.op[0].regs->reg_name);
7163 }
7164 }
7165 }
7166
7167 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7168 && i.tm.base_opcode == 0x8d /* lea */
7169 && !is_any_vex_encoding(&i.tm))
7170 {
7171 if (!quiet_warnings)
7172 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7173 if (optimize)
7174 {
7175 i.seg[0] = NULL;
7176 i.prefix[SEG_PREFIX] = 0;
7177 }
7178 }
7179
7180 /* If a segment was explicitly specified, and the specified segment
7181 is not the default, use an opcode prefix to select it. If we
7182 never figured out what the default segment is, then default_seg
7183 will be zero at this point, and the specified segment prefix will
7184 always be used. */
7185 if ((i.seg[0]) && (i.seg[0] != default_seg))
7186 {
7187 if (!add_prefix (i.seg[0]->seg_prefix))
7188 return 0;
7189 }
7190 return 1;
7191 }
7192
7193 static const seg_entry *
7194 build_modrm_byte (void)
7195 {
7196 const seg_entry *default_seg = 0;
7197 unsigned int source, dest;
7198 int vex_3_sources;
7199
7200 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7201 if (vex_3_sources)
7202 {
7203 unsigned int nds, reg_slot;
7204 expressionS *exp;
7205
7206 dest = i.operands - 1;
7207 nds = dest - 1;
7208
7209 /* There are 2 kinds of instructions:
7210 1. 5 operands: 4 register operands or 3 register operands
7211 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7212 VexW0 or VexW1. The destination must be either XMM, YMM or
7213 ZMM register.
7214 2. 4 operands: 4 register operands or 3 register operands
7215 plus 1 memory operand, with VexXDS. */
7216 gas_assert ((i.reg_operands == 4
7217 || (i.reg_operands == 3 && i.mem_operands == 1))
7218 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7219 && i.tm.opcode_modifier.vexw
7220 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7221
7222 /* If VexW1 is set, the first non-immediate operand is the source and
7223 the second non-immediate one is encoded in the immediate operand. */
7224 if (i.tm.opcode_modifier.vexw == VEXW1)
7225 {
7226 source = i.imm_operands;
7227 reg_slot = i.imm_operands + 1;
7228 }
7229 else
7230 {
7231 source = i.imm_operands + 1;
7232 reg_slot = i.imm_operands;
7233 }
7234
7235 if (i.imm_operands == 0)
7236 {
7237 /* When there is no immediate operand, generate an 8bit
7238 immediate operand to encode the first operand. */
7239 exp = &im_expressions[i.imm_operands++];
7240 i.op[i.operands].imms = exp;
7241 i.types[i.operands] = imm8;
7242 i.operands++;
7243
7244 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7245 exp->X_op = O_constant;
7246 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7247 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7248 }
7249 else
7250 {
7251 gas_assert (i.imm_operands == 1);
7252 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7253 gas_assert (!i.tm.opcode_modifier.immext);
7254
7255 /* Turn on Imm8 again so that output_imm will generate it. */
7256 i.types[0].bitfield.imm8 = 1;
7257
7258 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7259 i.op[0].imms->X_add_number
7260 |= register_number (i.op[reg_slot].regs) << 4;
7261 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7262 }
7263
7264 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7265 i.vex.register_specifier = i.op[nds].regs;
7266 }
7267 else
7268 source = dest = 0;
7269
7270 /* i.reg_operands MUST be the number of real register operands;
7271 implicit registers do not count. If there are 3 register
7272 operands, it must be a instruction with VexNDS. For a
7273 instruction with VexNDD, the destination register is encoded
7274 in VEX prefix. If there are 4 register operands, it must be
7275 a instruction with VEX prefix and 3 sources. */
7276 if (i.mem_operands == 0
7277 && ((i.reg_operands == 2
7278 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7279 || (i.reg_operands == 3
7280 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7281 || (i.reg_operands == 4 && vex_3_sources)))
7282 {
7283 switch (i.operands)
7284 {
7285 case 2:
7286 source = 0;
7287 break;
7288 case 3:
7289 /* When there are 3 operands, one of them may be immediate,
7290 which may be the first or the last operand. Otherwise,
7291 the first operand must be shift count register (cl) or it
7292 is an instruction with VexNDS. */
7293 gas_assert (i.imm_operands == 1
7294 || (i.imm_operands == 0
7295 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7296 || (i.types[0].bitfield.instance == RegC
7297 && i.types[0].bitfield.byte))));
7298 if (operand_type_check (i.types[0], imm)
7299 || (i.types[0].bitfield.instance == RegC
7300 && i.types[0].bitfield.byte))
7301 source = 1;
7302 else
7303 source = 0;
7304 break;
7305 case 4:
7306 /* When there are 4 operands, the first two must be 8bit
7307 immediate operands. The source operand will be the 3rd
7308 one.
7309
7310 For instructions with VexNDS, if the first operand
7311 an imm8, the source operand is the 2nd one. If the last
7312 operand is imm8, the source operand is the first one. */
7313 gas_assert ((i.imm_operands == 2
7314 && i.types[0].bitfield.imm8
7315 && i.types[1].bitfield.imm8)
7316 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7317 && i.imm_operands == 1
7318 && (i.types[0].bitfield.imm8
7319 || i.types[i.operands - 1].bitfield.imm8
7320 || i.rounding)));
7321 if (i.imm_operands == 2)
7322 source = 2;
7323 else
7324 {
7325 if (i.types[0].bitfield.imm8)
7326 source = 1;
7327 else
7328 source = 0;
7329 }
7330 break;
7331 case 5:
7332 if (is_evex_encoding (&i.tm))
7333 {
7334 /* For EVEX instructions, when there are 5 operands, the
7335 first one must be immediate operand. If the second one
7336 is immediate operand, the source operand is the 3th
7337 one. If the last one is immediate operand, the source
7338 operand is the 2nd one. */
7339 gas_assert (i.imm_operands == 2
7340 && i.tm.opcode_modifier.sae
7341 && operand_type_check (i.types[0], imm));
7342 if (operand_type_check (i.types[1], imm))
7343 source = 2;
7344 else if (operand_type_check (i.types[4], imm))
7345 source = 1;
7346 else
7347 abort ();
7348 }
7349 break;
7350 default:
7351 abort ();
7352 }
7353
7354 if (!vex_3_sources)
7355 {
7356 dest = source + 1;
7357
7358 /* RC/SAE operand could be between DEST and SRC. That happens
7359 when one operand is GPR and the other one is XMM/YMM/ZMM
7360 register. */
7361 if (i.rounding && i.rounding->operand == (int) dest)
7362 dest++;
7363
7364 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7365 {
7366 /* For instructions with VexNDS, the register-only source
7367 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7368 register. It is encoded in VEX prefix. */
7369
7370 i386_operand_type op;
7371 unsigned int vvvv;
7372
7373 /* Check register-only source operand when two source
7374 operands are swapped. */
7375 if (!i.tm.operand_types[source].bitfield.baseindex
7376 && i.tm.operand_types[dest].bitfield.baseindex)
7377 {
7378 vvvv = source;
7379 source = dest;
7380 }
7381 else
7382 vvvv = dest;
7383
7384 op = i.tm.operand_types[vvvv];
7385 if ((dest + 1) >= i.operands
7386 || ((op.bitfield.class != Reg
7387 || (!op.bitfield.dword && !op.bitfield.qword))
7388 && op.bitfield.class != RegSIMD
7389 && !operand_type_equal (&op, &regmask)))
7390 abort ();
7391 i.vex.register_specifier = i.op[vvvv].regs;
7392 dest++;
7393 }
7394 }
7395
7396 i.rm.mode = 3;
7397 /* One of the register operands will be encoded in the i.rm.reg
7398 field, the other in the combined i.rm.mode and i.rm.regmem
7399 fields. If no form of this instruction supports a memory
7400 destination operand, then we assume the source operand may
7401 sometimes be a memory operand and so we need to store the
7402 destination in the i.rm.reg field. */
7403 if (!i.tm.opcode_modifier.regmem
7404 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7405 {
7406 i.rm.reg = i.op[dest].regs->reg_num;
7407 i.rm.regmem = i.op[source].regs->reg_num;
7408 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7409 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7410 i.has_regmmx = TRUE;
7411 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7412 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7413 {
7414 if (i.types[dest].bitfield.zmmword
7415 || i.types[source].bitfield.zmmword)
7416 i.has_regzmm = TRUE;
7417 else if (i.types[dest].bitfield.ymmword
7418 || i.types[source].bitfield.ymmword)
7419 i.has_regymm = TRUE;
7420 else
7421 i.has_regxmm = TRUE;
7422 }
7423 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7424 i.rex |= REX_R;
7425 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7426 i.vrex |= REX_R;
7427 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7428 i.rex |= REX_B;
7429 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7430 i.vrex |= REX_B;
7431 }
7432 else
7433 {
7434 i.rm.reg = i.op[source].regs->reg_num;
7435 i.rm.regmem = i.op[dest].regs->reg_num;
7436 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7437 i.rex |= REX_B;
7438 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7439 i.vrex |= REX_B;
7440 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7441 i.rex |= REX_R;
7442 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7443 i.vrex |= REX_R;
7444 }
7445 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7446 {
7447 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7448 abort ();
7449 i.rex &= ~REX_R;
7450 add_prefix (LOCK_PREFIX_OPCODE);
7451 }
7452 }
7453 else
7454 { /* If it's not 2 reg operands... */
7455 unsigned int mem;
7456
7457 if (i.mem_operands)
7458 {
7459 unsigned int fake_zero_displacement = 0;
7460 unsigned int op;
7461
7462 for (op = 0; op < i.operands; op++)
7463 if (i.flags[op] & Operand_Mem)
7464 break;
7465 gas_assert (op < i.operands);
7466
7467 if (i.tm.opcode_modifier.vecsib)
7468 {
7469 if (i.index_reg->reg_num == RegIZ)
7470 abort ();
7471
7472 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7473 if (!i.base_reg)
7474 {
7475 i.sib.base = NO_BASE_REGISTER;
7476 i.sib.scale = i.log2_scale_factor;
7477 i.types[op].bitfield.disp8 = 0;
7478 i.types[op].bitfield.disp16 = 0;
7479 i.types[op].bitfield.disp64 = 0;
7480 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7481 {
7482 /* Must be 32 bit */
7483 i.types[op].bitfield.disp32 = 1;
7484 i.types[op].bitfield.disp32s = 0;
7485 }
7486 else
7487 {
7488 i.types[op].bitfield.disp32 = 0;
7489 i.types[op].bitfield.disp32s = 1;
7490 }
7491 }
7492 i.sib.index = i.index_reg->reg_num;
7493 if ((i.index_reg->reg_flags & RegRex) != 0)
7494 i.rex |= REX_X;
7495 if ((i.index_reg->reg_flags & RegVRex) != 0)
7496 i.vrex |= REX_X;
7497 }
7498
7499 default_seg = &ds;
7500
7501 if (i.base_reg == 0)
7502 {
7503 i.rm.mode = 0;
7504 if (!i.disp_operands)
7505 fake_zero_displacement = 1;
7506 if (i.index_reg == 0)
7507 {
7508 i386_operand_type newdisp;
7509
7510 gas_assert (!i.tm.opcode_modifier.vecsib);
7511 /* Operand is just <disp> */
7512 if (flag_code == CODE_64BIT)
7513 {
7514 /* 64bit mode overwrites the 32bit absolute
7515 addressing by RIP relative addressing and
7516 absolute addressing is encoded by one of the
7517 redundant SIB forms. */
7518 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7519 i.sib.base = NO_BASE_REGISTER;
7520 i.sib.index = NO_INDEX_REGISTER;
7521 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7522 }
7523 else if ((flag_code == CODE_16BIT)
7524 ^ (i.prefix[ADDR_PREFIX] != 0))
7525 {
7526 i.rm.regmem = NO_BASE_REGISTER_16;
7527 newdisp = disp16;
7528 }
7529 else
7530 {
7531 i.rm.regmem = NO_BASE_REGISTER;
7532 newdisp = disp32;
7533 }
7534 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7535 i.types[op] = operand_type_or (i.types[op], newdisp);
7536 }
7537 else if (!i.tm.opcode_modifier.vecsib)
7538 {
7539 /* !i.base_reg && i.index_reg */
7540 if (i.index_reg->reg_num == RegIZ)
7541 i.sib.index = NO_INDEX_REGISTER;
7542 else
7543 i.sib.index = i.index_reg->reg_num;
7544 i.sib.base = NO_BASE_REGISTER;
7545 i.sib.scale = i.log2_scale_factor;
7546 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7547 i.types[op].bitfield.disp8 = 0;
7548 i.types[op].bitfield.disp16 = 0;
7549 i.types[op].bitfield.disp64 = 0;
7550 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7551 {
7552 /* Must be 32 bit */
7553 i.types[op].bitfield.disp32 = 1;
7554 i.types[op].bitfield.disp32s = 0;
7555 }
7556 else
7557 {
7558 i.types[op].bitfield.disp32 = 0;
7559 i.types[op].bitfield.disp32s = 1;
7560 }
7561 if ((i.index_reg->reg_flags & RegRex) != 0)
7562 i.rex |= REX_X;
7563 }
7564 }
7565 /* RIP addressing for 64bit mode. */
7566 else if (i.base_reg->reg_num == RegIP)
7567 {
7568 gas_assert (!i.tm.opcode_modifier.vecsib);
7569 i.rm.regmem = NO_BASE_REGISTER;
7570 i.types[op].bitfield.disp8 = 0;
7571 i.types[op].bitfield.disp16 = 0;
7572 i.types[op].bitfield.disp32 = 0;
7573 i.types[op].bitfield.disp32s = 1;
7574 i.types[op].bitfield.disp64 = 0;
7575 i.flags[op] |= Operand_PCrel;
7576 if (! i.disp_operands)
7577 fake_zero_displacement = 1;
7578 }
7579 else if (i.base_reg->reg_type.bitfield.word)
7580 {
7581 gas_assert (!i.tm.opcode_modifier.vecsib);
7582 switch (i.base_reg->reg_num)
7583 {
7584 case 3: /* (%bx) */
7585 if (i.index_reg == 0)
7586 i.rm.regmem = 7;
7587 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7588 i.rm.regmem = i.index_reg->reg_num - 6;
7589 break;
7590 case 5: /* (%bp) */
7591 default_seg = &ss;
7592 if (i.index_reg == 0)
7593 {
7594 i.rm.regmem = 6;
7595 if (operand_type_check (i.types[op], disp) == 0)
7596 {
7597 /* fake (%bp) into 0(%bp) */
7598 i.types[op].bitfield.disp8 = 1;
7599 fake_zero_displacement = 1;
7600 }
7601 }
7602 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7603 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7604 break;
7605 default: /* (%si) -> 4 or (%di) -> 5 */
7606 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7607 }
7608 i.rm.mode = mode_from_disp_size (i.types[op]);
7609 }
7610 else /* i.base_reg and 32/64 bit mode */
7611 {
7612 if (flag_code == CODE_64BIT
7613 && operand_type_check (i.types[op], disp))
7614 {
7615 i.types[op].bitfield.disp16 = 0;
7616 i.types[op].bitfield.disp64 = 0;
7617 if (i.prefix[ADDR_PREFIX] == 0)
7618 {
7619 i.types[op].bitfield.disp32 = 0;
7620 i.types[op].bitfield.disp32s = 1;
7621 }
7622 else
7623 {
7624 i.types[op].bitfield.disp32 = 1;
7625 i.types[op].bitfield.disp32s = 0;
7626 }
7627 }
7628
7629 if (!i.tm.opcode_modifier.vecsib)
7630 i.rm.regmem = i.base_reg->reg_num;
7631 if ((i.base_reg->reg_flags & RegRex) != 0)
7632 i.rex |= REX_B;
7633 i.sib.base = i.base_reg->reg_num;
7634 /* x86-64 ignores REX prefix bit here to avoid decoder
7635 complications. */
7636 if (!(i.base_reg->reg_flags & RegRex)
7637 && (i.base_reg->reg_num == EBP_REG_NUM
7638 || i.base_reg->reg_num == ESP_REG_NUM))
7639 default_seg = &ss;
7640 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7641 {
7642 fake_zero_displacement = 1;
7643 i.types[op].bitfield.disp8 = 1;
7644 }
7645 i.sib.scale = i.log2_scale_factor;
7646 if (i.index_reg == 0)
7647 {
7648 gas_assert (!i.tm.opcode_modifier.vecsib);
7649 /* <disp>(%esp) becomes two byte modrm with no index
7650 register. We've already stored the code for esp
7651 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7652 Any base register besides %esp will not use the
7653 extra modrm byte. */
7654 i.sib.index = NO_INDEX_REGISTER;
7655 }
7656 else if (!i.tm.opcode_modifier.vecsib)
7657 {
7658 if (i.index_reg->reg_num == RegIZ)
7659 i.sib.index = NO_INDEX_REGISTER;
7660 else
7661 i.sib.index = i.index_reg->reg_num;
7662 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7663 if ((i.index_reg->reg_flags & RegRex) != 0)
7664 i.rex |= REX_X;
7665 }
7666
7667 if (i.disp_operands
7668 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7669 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7670 i.rm.mode = 0;
7671 else
7672 {
7673 if (!fake_zero_displacement
7674 && !i.disp_operands
7675 && i.disp_encoding)
7676 {
7677 fake_zero_displacement = 1;
7678 if (i.disp_encoding == disp_encoding_8bit)
7679 i.types[op].bitfield.disp8 = 1;
7680 else
7681 i.types[op].bitfield.disp32 = 1;
7682 }
7683 i.rm.mode = mode_from_disp_size (i.types[op]);
7684 }
7685 }
7686
7687 if (fake_zero_displacement)
7688 {
7689 /* Fakes a zero displacement assuming that i.types[op]
7690 holds the correct displacement size. */
7691 expressionS *exp;
7692
7693 gas_assert (i.op[op].disps == 0);
7694 exp = &disp_expressions[i.disp_operands++];
7695 i.op[op].disps = exp;
7696 exp->X_op = O_constant;
7697 exp->X_add_number = 0;
7698 exp->X_add_symbol = (symbolS *) 0;
7699 exp->X_op_symbol = (symbolS *) 0;
7700 }
7701
7702 mem = op;
7703 }
7704 else
7705 mem = ~0;
7706
7707 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7708 {
7709 if (operand_type_check (i.types[0], imm))
7710 i.vex.register_specifier = NULL;
7711 else
7712 {
7713 /* VEX.vvvv encodes one of the sources when the first
7714 operand is not an immediate. */
7715 if (i.tm.opcode_modifier.vexw == VEXW0)
7716 i.vex.register_specifier = i.op[0].regs;
7717 else
7718 i.vex.register_specifier = i.op[1].regs;
7719 }
7720
7721 /* Destination is a XMM register encoded in the ModRM.reg
7722 and VEX.R bit. */
7723 i.rm.reg = i.op[2].regs->reg_num;
7724 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7725 i.rex |= REX_R;
7726
7727 /* ModRM.rm and VEX.B encodes the other source. */
7728 if (!i.mem_operands)
7729 {
7730 i.rm.mode = 3;
7731
7732 if (i.tm.opcode_modifier.vexw == VEXW0)
7733 i.rm.regmem = i.op[1].regs->reg_num;
7734 else
7735 i.rm.regmem = i.op[0].regs->reg_num;
7736
7737 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7738 i.rex |= REX_B;
7739 }
7740 }
7741 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7742 {
7743 i.vex.register_specifier = i.op[2].regs;
7744 if (!i.mem_operands)
7745 {
7746 i.rm.mode = 3;
7747 i.rm.regmem = i.op[1].regs->reg_num;
7748 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7749 i.rex |= REX_B;
7750 }
7751 }
7752 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7753 (if any) based on i.tm.extension_opcode. Again, we must be
7754 careful to make sure that segment/control/debug/test/MMX
7755 registers are coded into the i.rm.reg field. */
7756 else if (i.reg_operands)
7757 {
7758 unsigned int op;
7759 unsigned int vex_reg = ~0;
7760
7761 for (op = 0; op < i.operands; op++)
7762 {
7763 if (i.types[op].bitfield.class == Reg
7764 || i.types[op].bitfield.class == RegBND
7765 || i.types[op].bitfield.class == RegMask
7766 || i.types[op].bitfield.class == SReg
7767 || i.types[op].bitfield.class == RegCR
7768 || i.types[op].bitfield.class == RegDR
7769 || i.types[op].bitfield.class == RegTR)
7770 break;
7771 if (i.types[op].bitfield.class == RegSIMD)
7772 {
7773 if (i.types[op].bitfield.zmmword)
7774 i.has_regzmm = TRUE;
7775 else if (i.types[op].bitfield.ymmword)
7776 i.has_regymm = TRUE;
7777 else
7778 i.has_regxmm = TRUE;
7779 break;
7780 }
7781 if (i.types[op].bitfield.class == RegMMX)
7782 {
7783 i.has_regmmx = TRUE;
7784 break;
7785 }
7786 }
7787
7788 if (vex_3_sources)
7789 op = dest;
7790 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7791 {
7792 /* For instructions with VexNDS, the register-only
7793 source operand is encoded in VEX prefix. */
7794 gas_assert (mem != (unsigned int) ~0);
7795
7796 if (op > mem)
7797 {
7798 vex_reg = op++;
7799 gas_assert (op < i.operands);
7800 }
7801 else
7802 {
7803 /* Check register-only source operand when two source
7804 operands are swapped. */
7805 if (!i.tm.operand_types[op].bitfield.baseindex
7806 && i.tm.operand_types[op + 1].bitfield.baseindex)
7807 {
7808 vex_reg = op;
7809 op += 2;
7810 gas_assert (mem == (vex_reg + 1)
7811 && op < i.operands);
7812 }
7813 else
7814 {
7815 vex_reg = op + 1;
7816 gas_assert (vex_reg < i.operands);
7817 }
7818 }
7819 }
7820 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7821 {
7822 /* For instructions with VexNDD, the register destination
7823 is encoded in VEX prefix. */
7824 if (i.mem_operands == 0)
7825 {
7826 /* There is no memory operand. */
7827 gas_assert ((op + 2) == i.operands);
7828 vex_reg = op + 1;
7829 }
7830 else
7831 {
7832 /* There are only 2 non-immediate operands. */
7833 gas_assert (op < i.imm_operands + 2
7834 && i.operands == i.imm_operands + 2);
7835 vex_reg = i.imm_operands + 1;
7836 }
7837 }
7838 else
7839 gas_assert (op < i.operands);
7840
7841 if (vex_reg != (unsigned int) ~0)
7842 {
7843 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7844
7845 if ((type->bitfield.class != Reg
7846 || (!type->bitfield.dword && !type->bitfield.qword))
7847 && type->bitfield.class != RegSIMD
7848 && !operand_type_equal (type, &regmask))
7849 abort ();
7850
7851 i.vex.register_specifier = i.op[vex_reg].regs;
7852 }
7853
7854 /* Don't set OP operand twice. */
7855 if (vex_reg != op)
7856 {
7857 /* If there is an extension opcode to put here, the
7858 register number must be put into the regmem field. */
7859 if (i.tm.extension_opcode != None)
7860 {
7861 i.rm.regmem = i.op[op].regs->reg_num;
7862 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7863 i.rex |= REX_B;
7864 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7865 i.vrex |= REX_B;
7866 }
7867 else
7868 {
7869 i.rm.reg = i.op[op].regs->reg_num;
7870 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7871 i.rex |= REX_R;
7872 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7873 i.vrex |= REX_R;
7874 }
7875 }
7876
7877 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7878 must set it to 3 to indicate this is a register operand
7879 in the regmem field. */
7880 if (!i.mem_operands)
7881 i.rm.mode = 3;
7882 }
7883
7884 /* Fill in i.rm.reg field with extension opcode (if any). */
7885 if (i.tm.extension_opcode != None)
7886 i.rm.reg = i.tm.extension_opcode;
7887 }
7888 return default_seg;
7889 }
7890
7891 static unsigned int
7892 flip_code16 (unsigned int code16)
7893 {
7894 gas_assert (i.tm.operands == 1);
7895
7896 return !(i.prefix[REX_PREFIX] & REX_W)
7897 && (code16 ? i.tm.operand_types[0].bitfield.disp32
7898 || i.tm.operand_types[0].bitfield.disp32s
7899 : i.tm.operand_types[0].bitfield.disp16)
7900 ? CODE16 : 0;
7901 }
7902
7903 static void
7904 output_branch (void)
7905 {
7906 char *p;
7907 int size;
7908 int code16;
7909 int prefix;
7910 relax_substateT subtype;
7911 symbolS *sym;
7912 offsetT off;
7913
7914 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7915 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7916
7917 prefix = 0;
7918 if (i.prefix[DATA_PREFIX] != 0)
7919 {
7920 prefix = 1;
7921 i.prefixes -= 1;
7922 code16 ^= flip_code16(code16);
7923 }
7924 /* Pentium4 branch hints. */
7925 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7926 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7927 {
7928 prefix++;
7929 i.prefixes--;
7930 }
7931 if (i.prefix[REX_PREFIX] != 0)
7932 {
7933 prefix++;
7934 i.prefixes--;
7935 }
7936
7937 /* BND prefixed jump. */
7938 if (i.prefix[BND_PREFIX] != 0)
7939 {
7940 prefix++;
7941 i.prefixes--;
7942 }
7943
7944 if (i.prefixes != 0)
7945 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
7946
7947 /* It's always a symbol; End frag & setup for relax.
7948 Make sure there is enough room in this frag for the largest
7949 instruction we may generate in md_convert_frag. This is 2
7950 bytes for the opcode and room for the prefix and largest
7951 displacement. */
7952 frag_grow (prefix + 2 + 4);
7953 /* Prefix and 1 opcode byte go in fr_fix. */
7954 p = frag_more (prefix + 1);
7955 if (i.prefix[DATA_PREFIX] != 0)
7956 *p++ = DATA_PREFIX_OPCODE;
7957 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7958 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7959 *p++ = i.prefix[SEG_PREFIX];
7960 if (i.prefix[BND_PREFIX] != 0)
7961 *p++ = BND_PREFIX_OPCODE;
7962 if (i.prefix[REX_PREFIX] != 0)
7963 *p++ = i.prefix[REX_PREFIX];
7964 *p = i.tm.base_opcode;
7965
7966 if ((unsigned char) *p == JUMP_PC_RELATIVE)
7967 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7968 else if (cpu_arch_flags.bitfield.cpui386)
7969 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7970 else
7971 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7972 subtype |= code16;
7973
7974 sym = i.op[0].disps->X_add_symbol;
7975 off = i.op[0].disps->X_add_number;
7976
7977 if (i.op[0].disps->X_op != O_constant
7978 && i.op[0].disps->X_op != O_symbol)
7979 {
7980 /* Handle complex expressions. */
7981 sym = make_expr_symbol (i.op[0].disps);
7982 off = 0;
7983 }
7984
7985 /* 1 possible extra opcode + 4 byte displacement go in var part.
7986 Pass reloc in fr_var. */
7987 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7988 }
7989
7990 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7991 /* Return TRUE iff PLT32 relocation should be used for branching to
7992 symbol S. */
7993
7994 static bfd_boolean
7995 need_plt32_p (symbolS *s)
7996 {
7997 /* PLT32 relocation is ELF only. */
7998 if (!IS_ELF)
7999 return FALSE;
8000
8001 #ifdef TE_SOLARIS
8002 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8003 krtld support it. */
8004 return FALSE;
8005 #endif
8006
8007 /* Since there is no need to prepare for PLT branch on x86-64, we
8008 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8009 be used as a marker for 32-bit PC-relative branches. */
8010 if (!object_64bit)
8011 return FALSE;
8012
8013 /* Weak or undefined symbol need PLT32 relocation. */
8014 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8015 return TRUE;
8016
8017 /* Non-global symbol doesn't need PLT32 relocation. */
8018 if (! S_IS_EXTERNAL (s))
8019 return FALSE;
8020
8021 /* Other global symbols need PLT32 relocation. NB: Symbol with
8022 non-default visibilities are treated as normal global symbol
8023 so that PLT32 relocation can be used as a marker for 32-bit
8024 PC-relative branches. It is useful for linker relaxation. */
8025 return TRUE;
8026 }
8027 #endif
8028
8029 static void
8030 output_jump (void)
8031 {
8032 char *p;
8033 int size;
8034 fixS *fixP;
8035 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8036
8037 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8038 {
8039 /* This is a loop or jecxz type instruction. */
8040 size = 1;
8041 if (i.prefix[ADDR_PREFIX] != 0)
8042 {
8043 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
8044 i.prefixes -= 1;
8045 }
8046 /* Pentium4 branch hints. */
8047 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8048 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8049 {
8050 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
8051 i.prefixes--;
8052 }
8053 }
8054 else
8055 {
8056 int code16;
8057
8058 code16 = 0;
8059 if (flag_code == CODE_16BIT)
8060 code16 = CODE16;
8061
8062 if (i.prefix[DATA_PREFIX] != 0)
8063 {
8064 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
8065 i.prefixes -= 1;
8066 code16 ^= flip_code16(code16);
8067 }
8068
8069 size = 4;
8070 if (code16)
8071 size = 2;
8072 }
8073
8074 /* BND prefixed jump. */
8075 if (i.prefix[BND_PREFIX] != 0)
8076 {
8077 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
8078 i.prefixes -= 1;
8079 }
8080
8081 if (i.prefix[REX_PREFIX] != 0)
8082 {
8083 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
8084 i.prefixes -= 1;
8085 }
8086
8087 if (i.prefixes != 0)
8088 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8089
8090 p = frag_more (i.tm.opcode_length + size);
8091 switch (i.tm.opcode_length)
8092 {
8093 case 2:
8094 *p++ = i.tm.base_opcode >> 8;
8095 /* Fall through. */
8096 case 1:
8097 *p++ = i.tm.base_opcode;
8098 break;
8099 default:
8100 abort ();
8101 }
8102
8103 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8104 if (size == 4
8105 && jump_reloc == NO_RELOC
8106 && need_plt32_p (i.op[0].disps->X_add_symbol))
8107 jump_reloc = BFD_RELOC_X86_64_PLT32;
8108 #endif
8109
8110 jump_reloc = reloc (size, 1, 1, jump_reloc);
8111
8112 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8113 i.op[0].disps, 1, jump_reloc);
8114
8115 /* All jumps handled here are signed, but don't use a signed limit
8116 check for 32 and 16 bit jumps as we want to allow wrap around at
8117 4G and 64k respectively. */
8118 if (size == 1)
8119 fixP->fx_signed = 1;
8120 }
8121
8122 static void
8123 output_interseg_jump (void)
8124 {
8125 char *p;
8126 int size;
8127 int prefix;
8128 int code16;
8129
8130 code16 = 0;
8131 if (flag_code == CODE_16BIT)
8132 code16 = CODE16;
8133
8134 prefix = 0;
8135 if (i.prefix[DATA_PREFIX] != 0)
8136 {
8137 prefix = 1;
8138 i.prefixes -= 1;
8139 code16 ^= CODE16;
8140 }
8141
8142 gas_assert (!i.prefix[REX_PREFIX]);
8143
8144 size = 4;
8145 if (code16)
8146 size = 2;
8147
8148 if (i.prefixes != 0)
8149 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8150
8151 /* 1 opcode; 2 segment; offset */
8152 p = frag_more (prefix + 1 + 2 + size);
8153
8154 if (i.prefix[DATA_PREFIX] != 0)
8155 *p++ = DATA_PREFIX_OPCODE;
8156
8157 if (i.prefix[REX_PREFIX] != 0)
8158 *p++ = i.prefix[REX_PREFIX];
8159
8160 *p++ = i.tm.base_opcode;
8161 if (i.op[1].imms->X_op == O_constant)
8162 {
8163 offsetT n = i.op[1].imms->X_add_number;
8164
8165 if (size == 2
8166 && !fits_in_unsigned_word (n)
8167 && !fits_in_signed_word (n))
8168 {
8169 as_bad (_("16-bit jump out of range"));
8170 return;
8171 }
8172 md_number_to_chars (p, n, size);
8173 }
8174 else
8175 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8176 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8177 if (i.op[0].imms->X_op != O_constant)
8178 as_bad (_("can't handle non absolute segment in `%s'"),
8179 i.tm.name);
8180 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8181 }
8182
8183 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8184 void
8185 x86_cleanup (void)
8186 {
8187 char *p;
8188 asection *seg = now_seg;
8189 subsegT subseg = now_subseg;
8190 asection *sec;
8191 unsigned int alignment, align_size_1;
8192 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8193 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8194 unsigned int padding;
8195
8196 if (!IS_ELF || !x86_used_note)
8197 return;
8198
8199 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8200
8201 /* The .note.gnu.property section layout:
8202
8203 Field Length Contents
8204 ---- ---- ----
8205 n_namsz 4 4
8206 n_descsz 4 The note descriptor size
8207 n_type 4 NT_GNU_PROPERTY_TYPE_0
8208 n_name 4 "GNU"
8209 n_desc n_descsz The program property array
8210 .... .... ....
8211 */
8212
8213 /* Create the .note.gnu.property section. */
8214 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8215 bfd_set_section_flags (sec,
8216 (SEC_ALLOC
8217 | SEC_LOAD
8218 | SEC_DATA
8219 | SEC_HAS_CONTENTS
8220 | SEC_READONLY));
8221
8222 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8223 {
8224 align_size_1 = 7;
8225 alignment = 3;
8226 }
8227 else
8228 {
8229 align_size_1 = 3;
8230 alignment = 2;
8231 }
8232
8233 bfd_set_section_alignment (sec, alignment);
8234 elf_section_type (sec) = SHT_NOTE;
8235
8236 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8237 + 4-byte data */
8238 isa_1_descsz_raw = 4 + 4 + 4;
8239 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8240 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8241
8242 feature_2_descsz_raw = isa_1_descsz;
8243 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8244 + 4-byte data */
8245 feature_2_descsz_raw += 4 + 4 + 4;
8246 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8247 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8248 & ~align_size_1);
8249
8250 descsz = feature_2_descsz;
8251 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8252 p = frag_more (4 + 4 + 4 + 4 + descsz);
8253
8254 /* Write n_namsz. */
8255 md_number_to_chars (p, (valueT) 4, 4);
8256
8257 /* Write n_descsz. */
8258 md_number_to_chars (p + 4, (valueT) descsz, 4);
8259
8260 /* Write n_type. */
8261 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8262
8263 /* Write n_name. */
8264 memcpy (p + 4 * 3, "GNU", 4);
8265
8266 /* Write 4-byte type. */
8267 md_number_to_chars (p + 4 * 4,
8268 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8269
8270 /* Write 4-byte data size. */
8271 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8272
8273 /* Write 4-byte data. */
8274 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8275
8276 /* Zero out paddings. */
8277 padding = isa_1_descsz - isa_1_descsz_raw;
8278 if (padding)
8279 memset (p + 4 * 7, 0, padding);
8280
8281 /* Write 4-byte type. */
8282 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8283 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8284
8285 /* Write 4-byte data size. */
8286 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8287
8288 /* Write 4-byte data. */
8289 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8290 (valueT) x86_feature_2_used, 4);
8291
8292 /* Zero out paddings. */
8293 padding = feature_2_descsz - feature_2_descsz_raw;
8294 if (padding)
8295 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8296
8297 /* We probably can't restore the current segment, for there likely
8298 isn't one yet... */
8299 if (seg && subseg)
8300 subseg_set (seg, subseg);
8301 }
8302 #endif
8303
8304 static unsigned int
8305 encoding_length (const fragS *start_frag, offsetT start_off,
8306 const char *frag_now_ptr)
8307 {
8308 unsigned int len = 0;
8309
8310 if (start_frag != frag_now)
8311 {
8312 const fragS *fr = start_frag;
8313
8314 do {
8315 len += fr->fr_fix;
8316 fr = fr->fr_next;
8317 } while (fr && fr != frag_now);
8318 }
8319
8320 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8321 }
8322
8323 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8324 be macro-fused with conditional jumps. */
8325
8326 static int
8327 maybe_fused_with_jcc_p (void)
8328 {
8329 /* No RIP address. */
8330 if (i.base_reg && i.base_reg->reg_num == RegIP)
8331 return 0;
8332
8333 /* No VEX/EVEX encoding. */
8334 if (is_any_vex_encoding (&i.tm))
8335 return 0;
8336
8337 /* and, add, sub with destination register. */
8338 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8339 || i.tm.base_opcode <= 5
8340 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8341 || ((i.tm.base_opcode | 3) == 0x83
8342 && ((i.tm.extension_opcode | 1) == 0x5
8343 || i.tm.extension_opcode == 0x0)))
8344 return (i.types[1].bitfield.class == Reg
8345 || i.types[1].bitfield.instance == Accum);
8346
8347 /* test, cmp with any register. */
8348 if ((i.tm.base_opcode | 1) == 0x85
8349 || (i.tm.base_opcode | 1) == 0xa9
8350 || ((i.tm.base_opcode | 1) == 0xf7
8351 && i.tm.extension_opcode == 0)
8352 || (i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8353 || ((i.tm.base_opcode | 3) == 0x83
8354 && (i.tm.extension_opcode == 0x7)))
8355 return (i.types[0].bitfield.class == Reg
8356 || i.types[0].bitfield.instance == Accum
8357 || i.types[1].bitfield.class == Reg
8358 || i.types[1].bitfield.instance == Accum);
8359
8360 /* inc, dec with any register. */
8361 if ((i.tm.cpu_flags.bitfield.cpuno64
8362 && (i.tm.base_opcode | 0xf) == 0x4f)
8363 || ((i.tm.base_opcode | 1) == 0xff
8364 && i.tm.extension_opcode <= 0x1))
8365 return (i.types[0].bitfield.class == Reg
8366 || i.types[0].bitfield.instance == Accum);
8367
8368 return 0;
8369 }
8370
8371 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
8372
8373 static int
8374 add_fused_jcc_padding_frag_p (void)
8375 {
8376 /* NB: Don't work with COND_JUMP86 without i386. */
8377 if (!align_branch_power
8378 || now_seg == absolute_section
8379 || !cpu_arch_flags.bitfield.cpui386
8380 || !(align_branch & align_branch_fused_bit))
8381 return 0;
8382
8383 if (maybe_fused_with_jcc_p ())
8384 {
8385 if (last_insn.kind == last_insn_other
8386 || last_insn.seg != now_seg)
8387 return 1;
8388 if (flag_debug)
8389 as_warn_where (last_insn.file, last_insn.line,
8390 _("`%s` skips -malign-branch-boundary on `%s`"),
8391 last_insn.name, i.tm.name);
8392 }
8393
8394 return 0;
8395 }
8396
8397 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
8398
8399 static int
8400 add_branch_prefix_frag_p (void)
8401 {
8402 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
8403 to PadLock instructions since they include prefixes in opcode. */
8404 if (!align_branch_power
8405 || !align_branch_prefix_size
8406 || now_seg == absolute_section
8407 || i.tm.cpu_flags.bitfield.cpupadlock
8408 || !cpu_arch_flags.bitfield.cpui386)
8409 return 0;
8410
8411 /* Don't add prefix if it is a prefix or there is no operand in case
8412 that segment prefix is special. */
8413 if (!i.operands || i.tm.opcode_modifier.isprefix)
8414 return 0;
8415
8416 if (last_insn.kind == last_insn_other
8417 || last_insn.seg != now_seg)
8418 return 1;
8419
8420 if (flag_debug)
8421 as_warn_where (last_insn.file, last_insn.line,
8422 _("`%s` skips -malign-branch-boundary on `%s`"),
8423 last_insn.name, i.tm.name);
8424
8425 return 0;
8426 }
8427
8428 /* Return 1 if a BRANCH_PADDING frag should be generated. */
8429
8430 static int
8431 add_branch_padding_frag_p (enum align_branch_kind *branch_p)
8432 {
8433 int add_padding;
8434
8435 /* NB: Don't work with COND_JUMP86 without i386. */
8436 if (!align_branch_power
8437 || now_seg == absolute_section
8438 || !cpu_arch_flags.bitfield.cpui386)
8439 return 0;
8440
8441 add_padding = 0;
8442
8443 /* Check for jcc and direct jmp. */
8444 if (i.tm.opcode_modifier.jump == JUMP)
8445 {
8446 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
8447 {
8448 *branch_p = align_branch_jmp;
8449 add_padding = align_branch & align_branch_jmp_bit;
8450 }
8451 else
8452 {
8453 *branch_p = align_branch_jcc;
8454 if ((align_branch & align_branch_jcc_bit))
8455 add_padding = 1;
8456 }
8457 }
8458 else if (is_any_vex_encoding (&i.tm))
8459 return 0;
8460 else if ((i.tm.base_opcode | 1) == 0xc3)
8461 {
8462 /* Near ret. */
8463 *branch_p = align_branch_ret;
8464 if ((align_branch & align_branch_ret_bit))
8465 add_padding = 1;
8466 }
8467 else
8468 {
8469 /* Check for indirect jmp, direct and indirect calls. */
8470 if (i.tm.base_opcode == 0xe8)
8471 {
8472 /* Direct call. */
8473 *branch_p = align_branch_call;
8474 if ((align_branch & align_branch_call_bit))
8475 add_padding = 1;
8476 }
8477 else if (i.tm.base_opcode == 0xff
8478 && (i.tm.extension_opcode == 2
8479 || i.tm.extension_opcode == 4))
8480 {
8481 /* Indirect call and jmp. */
8482 *branch_p = align_branch_indirect;
8483 if ((align_branch & align_branch_indirect_bit))
8484 add_padding = 1;
8485 }
8486
8487 if (add_padding
8488 && i.disp_operands
8489 && tls_get_addr
8490 && (i.op[0].disps->X_op == O_symbol
8491 || (i.op[0].disps->X_op == O_subtract
8492 && i.op[0].disps->X_op_symbol == GOT_symbol)))
8493 {
8494 symbolS *s = i.op[0].disps->X_add_symbol;
8495 /* No padding to call to global or undefined tls_get_addr. */
8496 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
8497 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
8498 return 0;
8499 }
8500 }
8501
8502 if (add_padding
8503 && last_insn.kind != last_insn_other
8504 && last_insn.seg == now_seg)
8505 {
8506 if (flag_debug)
8507 as_warn_where (last_insn.file, last_insn.line,
8508 _("`%s` skips -malign-branch-boundary on `%s`"),
8509 last_insn.name, i.tm.name);
8510 return 0;
8511 }
8512
8513 return add_padding;
8514 }
8515
8516 static void
8517 output_insn (void)
8518 {
8519 fragS *insn_start_frag;
8520 offsetT insn_start_off;
8521 fragS *fragP = NULL;
8522 enum align_branch_kind branch = align_branch_none;
8523
8524 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8525 if (IS_ELF && x86_used_note)
8526 {
8527 if (i.tm.cpu_flags.bitfield.cpucmov)
8528 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8529 if (i.tm.cpu_flags.bitfield.cpusse)
8530 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8531 if (i.tm.cpu_flags.bitfield.cpusse2)
8532 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8533 if (i.tm.cpu_flags.bitfield.cpusse3)
8534 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8535 if (i.tm.cpu_flags.bitfield.cpussse3)
8536 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8537 if (i.tm.cpu_flags.bitfield.cpusse4_1)
8538 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8539 if (i.tm.cpu_flags.bitfield.cpusse4_2)
8540 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8541 if (i.tm.cpu_flags.bitfield.cpuavx)
8542 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8543 if (i.tm.cpu_flags.bitfield.cpuavx2)
8544 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8545 if (i.tm.cpu_flags.bitfield.cpufma)
8546 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8547 if (i.tm.cpu_flags.bitfield.cpuavx512f)
8548 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8549 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8550 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8551 if (i.tm.cpu_flags.bitfield.cpuavx512er)
8552 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8553 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8554 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8555 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8556 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8557 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8558 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8559 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8560 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8561 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8562 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8563 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8564 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8565 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8566 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8567 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8568 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8569 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8570 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8571 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8572 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8573 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8574 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8575 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8576 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8577
8578 if (i.tm.cpu_flags.bitfield.cpu8087
8579 || i.tm.cpu_flags.bitfield.cpu287
8580 || i.tm.cpu_flags.bitfield.cpu387
8581 || i.tm.cpu_flags.bitfield.cpu687
8582 || i.tm.cpu_flags.bitfield.cpufisttp)
8583 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8584 if (i.has_regmmx
8585 || i.tm.base_opcode == 0xf77 /* emms */
8586 || i.tm.base_opcode == 0xf0e /* femms */)
8587 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8588 if (i.has_regxmm)
8589 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8590 if (i.has_regymm)
8591 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8592 if (i.has_regzmm)
8593 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8594 if (i.tm.cpu_flags.bitfield.cpufxsr)
8595 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8596 if (i.tm.cpu_flags.bitfield.cpuxsave)
8597 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8598 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8599 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8600 if (i.tm.cpu_flags.bitfield.cpuxsavec)
8601 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8602 }
8603 #endif
8604
8605 /* Tie dwarf2 debug info to the address at the start of the insn.
8606 We can't do this after the insn has been output as the current
8607 frag may have been closed off. eg. by frag_var. */
8608 dwarf2_emit_insn (0);
8609
8610 insn_start_frag = frag_now;
8611 insn_start_off = frag_now_fix ();
8612
8613 if (add_branch_padding_frag_p (&branch))
8614 {
8615 char *p;
8616 /* Branch can be 8 bytes. Leave some room for prefixes. */
8617 unsigned int max_branch_padding_size = 14;
8618
8619 /* Align section to boundary. */
8620 record_alignment (now_seg, align_branch_power);
8621
8622 /* Make room for padding. */
8623 frag_grow (max_branch_padding_size);
8624
8625 /* Start of the padding. */
8626 p = frag_more (0);
8627
8628 fragP = frag_now;
8629
8630 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
8631 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
8632 NULL, 0, p);
8633
8634 fragP->tc_frag_data.branch_type = branch;
8635 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
8636 }
8637
8638 /* Output jumps. */
8639 if (i.tm.opcode_modifier.jump == JUMP)
8640 output_branch ();
8641 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
8642 || i.tm.opcode_modifier.jump == JUMP_DWORD)
8643 output_jump ();
8644 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
8645 output_interseg_jump ();
8646 else
8647 {
8648 /* Output normal instructions here. */
8649 char *p;
8650 unsigned char *q;
8651 unsigned int j;
8652 unsigned int prefix;
8653
8654 if (avoid_fence
8655 && (i.tm.base_opcode == 0xfaee8
8656 || i.tm.base_opcode == 0xfaef0
8657 || i.tm.base_opcode == 0xfaef8))
8658 {
8659 /* Encode lfence, mfence, and sfence as
8660 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
8661 offsetT val = 0x240483f0ULL;
8662 p = frag_more (5);
8663 md_number_to_chars (p, val, 5);
8664 return;
8665 }
8666
8667 /* Some processors fail on LOCK prefix. This options makes
8668 assembler ignore LOCK prefix and serves as a workaround. */
8669 if (omit_lock_prefix)
8670 {
8671 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8672 return;
8673 i.prefix[LOCK_PREFIX] = 0;
8674 }
8675
8676 if (branch)
8677 /* Skip if this is a branch. */
8678 ;
8679 else if (add_fused_jcc_padding_frag_p ())
8680 {
8681 /* Make room for padding. */
8682 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
8683 p = frag_more (0);
8684
8685 fragP = frag_now;
8686
8687 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
8688 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
8689 NULL, 0, p);
8690
8691 fragP->tc_frag_data.branch_type = align_branch_fused;
8692 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
8693 }
8694 else if (add_branch_prefix_frag_p ())
8695 {
8696 unsigned int max_prefix_size = align_branch_prefix_size;
8697
8698 /* Make room for padding. */
8699 frag_grow (max_prefix_size);
8700 p = frag_more (0);
8701
8702 fragP = frag_now;
8703
8704 frag_var (rs_machine_dependent, max_prefix_size, 0,
8705 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
8706 NULL, 0, p);
8707
8708 fragP->tc_frag_data.max_bytes = max_prefix_size;
8709 }
8710
8711 /* Since the VEX/EVEX prefix contains the implicit prefix, we
8712 don't need the explicit prefix. */
8713 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8714 {
8715 switch (i.tm.opcode_length)
8716 {
8717 case 3:
8718 if (i.tm.base_opcode & 0xff000000)
8719 {
8720 prefix = (i.tm.base_opcode >> 24) & 0xff;
8721 if (!i.tm.cpu_flags.bitfield.cpupadlock
8722 || prefix != REPE_PREFIX_OPCODE
8723 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8724 add_prefix (prefix);
8725 }
8726 break;
8727 case 2:
8728 if ((i.tm.base_opcode & 0xff0000) != 0)
8729 {
8730 prefix = (i.tm.base_opcode >> 16) & 0xff;
8731 add_prefix (prefix);
8732 }
8733 break;
8734 case 1:
8735 break;
8736 case 0:
8737 /* Check for pseudo prefixes. */
8738 as_bad_where (insn_start_frag->fr_file,
8739 insn_start_frag->fr_line,
8740 _("pseudo prefix without instruction"));
8741 return;
8742 default:
8743 abort ();
8744 }
8745
8746 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8747 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8748 R_X86_64_GOTTPOFF relocation so that linker can safely
8749 perform IE->LE optimization. A dummy REX_OPCODE prefix
8750 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
8751 relocation for GDesc -> IE/LE optimization. */
8752 if (x86_elf_abi == X86_64_X32_ABI
8753 && i.operands == 2
8754 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8755 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
8756 && i.prefix[REX_PREFIX] == 0)
8757 add_prefix (REX_OPCODE);
8758 #endif
8759
8760 /* The prefix bytes. */
8761 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8762 if (*q)
8763 FRAG_APPEND_1_CHAR (*q);
8764 }
8765 else
8766 {
8767 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8768 if (*q)
8769 switch (j)
8770 {
8771 case REX_PREFIX:
8772 /* REX byte is encoded in VEX prefix. */
8773 break;
8774 case SEG_PREFIX:
8775 case ADDR_PREFIX:
8776 FRAG_APPEND_1_CHAR (*q);
8777 break;
8778 default:
8779 /* There should be no other prefixes for instructions
8780 with VEX prefix. */
8781 abort ();
8782 }
8783
8784 /* For EVEX instructions i.vrex should become 0 after
8785 build_evex_prefix. For VEX instructions upper 16 registers
8786 aren't available, so VREX should be 0. */
8787 if (i.vrex)
8788 abort ();
8789 /* Now the VEX prefix. */
8790 p = frag_more (i.vex.length);
8791 for (j = 0; j < i.vex.length; j++)
8792 p[j] = i.vex.bytes[j];
8793 }
8794
8795 /* Now the opcode; be careful about word order here! */
8796 if (i.tm.opcode_length == 1)
8797 {
8798 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8799 }
8800 else
8801 {
8802 switch (i.tm.opcode_length)
8803 {
8804 case 4:
8805 p = frag_more (4);
8806 *p++ = (i.tm.base_opcode >> 24) & 0xff;
8807 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8808 break;
8809 case 3:
8810 p = frag_more (3);
8811 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8812 break;
8813 case 2:
8814 p = frag_more (2);
8815 break;
8816 default:
8817 abort ();
8818 break;
8819 }
8820
8821 /* Put out high byte first: can't use md_number_to_chars! */
8822 *p++ = (i.tm.base_opcode >> 8) & 0xff;
8823 *p = i.tm.base_opcode & 0xff;
8824 }
8825
8826 /* Now the modrm byte and sib byte (if present). */
8827 if (i.tm.opcode_modifier.modrm)
8828 {
8829 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8830 | i.rm.reg << 3
8831 | i.rm.mode << 6));
8832 /* If i.rm.regmem == ESP (4)
8833 && i.rm.mode != (Register mode)
8834 && not 16 bit
8835 ==> need second modrm byte. */
8836 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8837 && i.rm.mode != 3
8838 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8839 FRAG_APPEND_1_CHAR ((i.sib.base << 0
8840 | i.sib.index << 3
8841 | i.sib.scale << 6));
8842 }
8843
8844 if (i.disp_operands)
8845 output_disp (insn_start_frag, insn_start_off);
8846
8847 if (i.imm_operands)
8848 output_imm (insn_start_frag, insn_start_off);
8849
8850 /*
8851 * frag_now_fix () returning plain abs_section_offset when we're in the
8852 * absolute section, and abs_section_offset not getting updated as data
8853 * gets added to the frag breaks the logic below.
8854 */
8855 if (now_seg != absolute_section)
8856 {
8857 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8858 if (j > 15)
8859 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8860 j);
8861 else if (fragP)
8862 {
8863 /* NB: Don't add prefix with GOTPC relocation since
8864 output_disp() above depends on the fixed encoding
8865 length. Can't add prefix with TLS relocation since
8866 it breaks TLS linker optimization. */
8867 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
8868 /* Prefix count on the current instruction. */
8869 unsigned int count = i.vex.length;
8870 unsigned int k;
8871 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
8872 /* REX byte is encoded in VEX/EVEX prefix. */
8873 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
8874 count++;
8875
8876 /* Count prefixes for extended opcode maps. */
8877 if (!i.vex.length)
8878 switch (i.tm.opcode_length)
8879 {
8880 case 3:
8881 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
8882 {
8883 count++;
8884 switch ((i.tm.base_opcode >> 8) & 0xff)
8885 {
8886 case 0x38:
8887 case 0x3a:
8888 count++;
8889 break;
8890 default:
8891 break;
8892 }
8893 }
8894 break;
8895 case 2:
8896 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
8897 count++;
8898 break;
8899 case 1:
8900 break;
8901 default:
8902 abort ();
8903 }
8904
8905 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
8906 == BRANCH_PREFIX)
8907 {
8908 /* Set the maximum prefix size in BRANCH_PREFIX
8909 frag. */
8910 if (fragP->tc_frag_data.max_bytes > max)
8911 fragP->tc_frag_data.max_bytes = max;
8912 if (fragP->tc_frag_data.max_bytes > count)
8913 fragP->tc_frag_data.max_bytes -= count;
8914 else
8915 fragP->tc_frag_data.max_bytes = 0;
8916 }
8917 else
8918 {
8919 /* Remember the maximum prefix size in FUSED_JCC_PADDING
8920 frag. */
8921 unsigned int max_prefix_size;
8922 if (align_branch_prefix_size > max)
8923 max_prefix_size = max;
8924 else
8925 max_prefix_size = align_branch_prefix_size;
8926 if (max_prefix_size > count)
8927 fragP->tc_frag_data.max_prefix_length
8928 = max_prefix_size - count;
8929 }
8930
8931 /* Use existing segment prefix if possible. Use CS
8932 segment prefix in 64-bit mode. In 32-bit mode, use SS
8933 segment prefix with ESP/EBP base register and use DS
8934 segment prefix without ESP/EBP base register. */
8935 if (i.prefix[SEG_PREFIX])
8936 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
8937 else if (flag_code == CODE_64BIT)
8938 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
8939 else if (i.base_reg
8940 && (i.base_reg->reg_num == 4
8941 || i.base_reg->reg_num == 5))
8942 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
8943 else
8944 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
8945 }
8946 }
8947 }
8948
8949 /* NB: Don't work with COND_JUMP86 without i386. */
8950 if (align_branch_power
8951 && now_seg != absolute_section
8952 && cpu_arch_flags.bitfield.cpui386)
8953 {
8954 /* Terminate each frag so that we can add prefix and check for
8955 fused jcc. */
8956 frag_wane (frag_now);
8957 frag_new (0);
8958 }
8959
8960 #ifdef DEBUG386
8961 if (flag_debug)
8962 {
8963 pi ("" /*line*/, &i);
8964 }
8965 #endif /* DEBUG386 */
8966 }
8967
8968 /* Return the size of the displacement operand N. */
8969
8970 static int
8971 disp_size (unsigned int n)
8972 {
8973 int size = 4;
8974
8975 if (i.types[n].bitfield.disp64)
8976 size = 8;
8977 else if (i.types[n].bitfield.disp8)
8978 size = 1;
8979 else if (i.types[n].bitfield.disp16)
8980 size = 2;
8981 return size;
8982 }
8983
8984 /* Return the size of the immediate operand N. */
8985
8986 static int
8987 imm_size (unsigned int n)
8988 {
8989 int size = 4;
8990 if (i.types[n].bitfield.imm64)
8991 size = 8;
8992 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8993 size = 1;
8994 else if (i.types[n].bitfield.imm16)
8995 size = 2;
8996 return size;
8997 }
8998
8999 static void
9000 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9001 {
9002 char *p;
9003 unsigned int n;
9004
9005 for (n = 0; n < i.operands; n++)
9006 {
9007 if (operand_type_check (i.types[n], disp))
9008 {
9009 if (i.op[n].disps->X_op == O_constant)
9010 {
9011 int size = disp_size (n);
9012 offsetT val = i.op[n].disps->X_add_number;
9013
9014 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9015 size);
9016 p = frag_more (size);
9017 md_number_to_chars (p, val, size);
9018 }
9019 else
9020 {
9021 enum bfd_reloc_code_real reloc_type;
9022 int size = disp_size (n);
9023 int sign = i.types[n].bitfield.disp32s;
9024 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9025 fixS *fixP;
9026
9027 /* We can't have 8 bit displacement here. */
9028 gas_assert (!i.types[n].bitfield.disp8);
9029
9030 /* The PC relative address is computed relative
9031 to the instruction boundary, so in case immediate
9032 fields follows, we need to adjust the value. */
9033 if (pcrel && i.imm_operands)
9034 {
9035 unsigned int n1;
9036 int sz = 0;
9037
9038 for (n1 = 0; n1 < i.operands; n1++)
9039 if (operand_type_check (i.types[n1], imm))
9040 {
9041 /* Only one immediate is allowed for PC
9042 relative address. */
9043 gas_assert (sz == 0);
9044 sz = imm_size (n1);
9045 i.op[n].disps->X_add_number -= sz;
9046 }
9047 /* We should find the immediate. */
9048 gas_assert (sz != 0);
9049 }
9050
9051 p = frag_more (size);
9052 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9053 if (GOT_symbol
9054 && GOT_symbol == i.op[n].disps->X_add_symbol
9055 && (((reloc_type == BFD_RELOC_32
9056 || reloc_type == BFD_RELOC_X86_64_32S
9057 || (reloc_type == BFD_RELOC_64
9058 && object_64bit))
9059 && (i.op[n].disps->X_op == O_symbol
9060 || (i.op[n].disps->X_op == O_add
9061 && ((symbol_get_value_expression
9062 (i.op[n].disps->X_op_symbol)->X_op)
9063 == O_subtract))))
9064 || reloc_type == BFD_RELOC_32_PCREL))
9065 {
9066 if (!object_64bit)
9067 {
9068 reloc_type = BFD_RELOC_386_GOTPC;
9069 i.has_gotpc_tls_reloc = TRUE;
9070 i.op[n].imms->X_add_number +=
9071 encoding_length (insn_start_frag, insn_start_off, p);
9072 }
9073 else if (reloc_type == BFD_RELOC_64)
9074 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9075 else
9076 /* Don't do the adjustment for x86-64, as there
9077 the pcrel addressing is relative to the _next_
9078 insn, and that is taken care of in other code. */
9079 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9080 }
9081 else if (align_branch_power)
9082 {
9083 switch (reloc_type)
9084 {
9085 case BFD_RELOC_386_TLS_GD:
9086 case BFD_RELOC_386_TLS_LDM:
9087 case BFD_RELOC_386_TLS_IE:
9088 case BFD_RELOC_386_TLS_IE_32:
9089 case BFD_RELOC_386_TLS_GOTIE:
9090 case BFD_RELOC_386_TLS_GOTDESC:
9091 case BFD_RELOC_386_TLS_DESC_CALL:
9092 case BFD_RELOC_X86_64_TLSGD:
9093 case BFD_RELOC_X86_64_TLSLD:
9094 case BFD_RELOC_X86_64_GOTTPOFF:
9095 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9096 case BFD_RELOC_X86_64_TLSDESC_CALL:
9097 i.has_gotpc_tls_reloc = TRUE;
9098 default:
9099 break;
9100 }
9101 }
9102 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9103 size, i.op[n].disps, pcrel,
9104 reloc_type);
9105 /* Check for "call/jmp *mem", "mov mem, %reg",
9106 "test %reg, mem" and "binop mem, %reg" where binop
9107 is one of adc, add, and, cmp, or, sbb, sub, xor
9108 instructions without data prefix. Always generate
9109 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9110 if (i.prefix[DATA_PREFIX] == 0
9111 && (generate_relax_relocations
9112 || (!object_64bit
9113 && i.rm.mode == 0
9114 && i.rm.regmem == 5))
9115 && (i.rm.mode == 2
9116 || (i.rm.mode == 0 && i.rm.regmem == 5))
9117 && !is_any_vex_encoding(&i.tm)
9118 && ((i.operands == 1
9119 && i.tm.base_opcode == 0xff
9120 && (i.rm.reg == 2 || i.rm.reg == 4))
9121 || (i.operands == 2
9122 && (i.tm.base_opcode == 0x8b
9123 || i.tm.base_opcode == 0x85
9124 || (i.tm.base_opcode & ~0x38) == 0x03))))
9125 {
9126 if (object_64bit)
9127 {
9128 fixP->fx_tcbit = i.rex != 0;
9129 if (i.base_reg
9130 && (i.base_reg->reg_num == RegIP))
9131 fixP->fx_tcbit2 = 1;
9132 }
9133 else
9134 fixP->fx_tcbit2 = 1;
9135 }
9136 }
9137 }
9138 }
9139 }
9140
9141 static void
9142 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9143 {
9144 char *p;
9145 unsigned int n;
9146
9147 for (n = 0; n < i.operands; n++)
9148 {
9149 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9150 if (i.rounding && (int) n == i.rounding->operand)
9151 continue;
9152
9153 if (operand_type_check (i.types[n], imm))
9154 {
9155 if (i.op[n].imms->X_op == O_constant)
9156 {
9157 int size = imm_size (n);
9158 offsetT val;
9159
9160 val = offset_in_range (i.op[n].imms->X_add_number,
9161 size);
9162 p = frag_more (size);
9163 md_number_to_chars (p, val, size);
9164 }
9165 else
9166 {
9167 /* Not absolute_section.
9168 Need a 32-bit fixup (don't support 8bit
9169 non-absolute imms). Try to support other
9170 sizes ... */
9171 enum bfd_reloc_code_real reloc_type;
9172 int size = imm_size (n);
9173 int sign;
9174
9175 if (i.types[n].bitfield.imm32s
9176 && (i.suffix == QWORD_MNEM_SUFFIX
9177 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9178 sign = 1;
9179 else
9180 sign = 0;
9181
9182 p = frag_more (size);
9183 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9184
9185 /* This is tough to explain. We end up with this one if we
9186 * have operands that look like
9187 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9188 * obtain the absolute address of the GOT, and it is strongly
9189 * preferable from a performance point of view to avoid using
9190 * a runtime relocation for this. The actual sequence of
9191 * instructions often look something like:
9192 *
9193 * call .L66
9194 * .L66:
9195 * popl %ebx
9196 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9197 *
9198 * The call and pop essentially return the absolute address
9199 * of the label .L66 and store it in %ebx. The linker itself
9200 * will ultimately change the first operand of the addl so
9201 * that %ebx points to the GOT, but to keep things simple, the
9202 * .o file must have this operand set so that it generates not
9203 * the absolute address of .L66, but the absolute address of
9204 * itself. This allows the linker itself simply treat a GOTPC
9205 * relocation as asking for a pcrel offset to the GOT to be
9206 * added in, and the addend of the relocation is stored in the
9207 * operand field for the instruction itself.
9208 *
9209 * Our job here is to fix the operand so that it would add
9210 * the correct offset so that %ebx would point to itself. The
9211 * thing that is tricky is that .-.L66 will point to the
9212 * beginning of the instruction, so we need to further modify
9213 * the operand so that it will point to itself. There are
9214 * other cases where you have something like:
9215 *
9216 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9217 *
9218 * and here no correction would be required. Internally in
9219 * the assembler we treat operands of this form as not being
9220 * pcrel since the '.' is explicitly mentioned, and I wonder
9221 * whether it would simplify matters to do it this way. Who
9222 * knows. In earlier versions of the PIC patches, the
9223 * pcrel_adjust field was used to store the correction, but
9224 * since the expression is not pcrel, I felt it would be
9225 * confusing to do it this way. */
9226
9227 if ((reloc_type == BFD_RELOC_32
9228 || reloc_type == BFD_RELOC_X86_64_32S
9229 || reloc_type == BFD_RELOC_64)
9230 && GOT_symbol
9231 && GOT_symbol == i.op[n].imms->X_add_symbol
9232 && (i.op[n].imms->X_op == O_symbol
9233 || (i.op[n].imms->X_op == O_add
9234 && ((symbol_get_value_expression
9235 (i.op[n].imms->X_op_symbol)->X_op)
9236 == O_subtract))))
9237 {
9238 if (!object_64bit)
9239 reloc_type = BFD_RELOC_386_GOTPC;
9240 else if (size == 4)
9241 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9242 else if (size == 8)
9243 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9244 i.has_gotpc_tls_reloc = TRUE;
9245 i.op[n].imms->X_add_number +=
9246 encoding_length (insn_start_frag, insn_start_off, p);
9247 }
9248 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9249 i.op[n].imms, 0, reloc_type);
9250 }
9251 }
9252 }
9253 }
9254 \f
9255 /* x86_cons_fix_new is called via the expression parsing code when a
9256 reloc is needed. We use this hook to get the correct .got reloc. */
9257 static int cons_sign = -1;
9258
9259 void
9260 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9261 expressionS *exp, bfd_reloc_code_real_type r)
9262 {
9263 r = reloc (len, 0, cons_sign, r);
9264
9265 #ifdef TE_PE
9266 if (exp->X_op == O_secrel)
9267 {
9268 exp->X_op = O_symbol;
9269 r = BFD_RELOC_32_SECREL;
9270 }
9271 #endif
9272
9273 fix_new_exp (frag, off, len, exp, 0, r);
9274 }
9275
9276 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9277 purpose of the `.dc.a' internal pseudo-op. */
9278
9279 int
9280 x86_address_bytes (void)
9281 {
9282 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9283 return 4;
9284 return stdoutput->arch_info->bits_per_address / 8;
9285 }
9286
9287 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9288 || defined (LEX_AT)
9289 # define lex_got(reloc, adjust, types) NULL
9290 #else
9291 /* Parse operands of the form
9292 <symbol>@GOTOFF+<nnn>
9293 and similar .plt or .got references.
9294
9295 If we find one, set up the correct relocation in RELOC and copy the
9296 input string, minus the `@GOTOFF' into a malloc'd buffer for
9297 parsing by the calling routine. Return this buffer, and if ADJUST
9298 is non-null set it to the length of the string we removed from the
9299 input line. Otherwise return NULL. */
9300 static char *
9301 lex_got (enum bfd_reloc_code_real *rel,
9302 int *adjust,
9303 i386_operand_type *types)
9304 {
9305 /* Some of the relocations depend on the size of what field is to
9306 be relocated. But in our callers i386_immediate and i386_displacement
9307 we don't yet know the operand size (this will be set by insn
9308 matching). Hence we record the word32 relocation here,
9309 and adjust the reloc according to the real size in reloc(). */
9310 static const struct {
9311 const char *str;
9312 int len;
9313 const enum bfd_reloc_code_real rel[2];
9314 const i386_operand_type types64;
9315 } gotrel[] = {
9316 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9317 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9318 BFD_RELOC_SIZE32 },
9319 OPERAND_TYPE_IMM32_64 },
9320 #endif
9321 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9322 BFD_RELOC_X86_64_PLTOFF64 },
9323 OPERAND_TYPE_IMM64 },
9324 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9325 BFD_RELOC_X86_64_PLT32 },
9326 OPERAND_TYPE_IMM32_32S_DISP32 },
9327 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9328 BFD_RELOC_X86_64_GOTPLT64 },
9329 OPERAND_TYPE_IMM64_DISP64 },
9330 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9331 BFD_RELOC_X86_64_GOTOFF64 },
9332 OPERAND_TYPE_IMM64_DISP64 },
9333 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
9334 BFD_RELOC_X86_64_GOTPCREL },
9335 OPERAND_TYPE_IMM32_32S_DISP32 },
9336 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
9337 BFD_RELOC_X86_64_TLSGD },
9338 OPERAND_TYPE_IMM32_32S_DISP32 },
9339 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
9340 _dummy_first_bfd_reloc_code_real },
9341 OPERAND_TYPE_NONE },
9342 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
9343 BFD_RELOC_X86_64_TLSLD },
9344 OPERAND_TYPE_IMM32_32S_DISP32 },
9345 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
9346 BFD_RELOC_X86_64_GOTTPOFF },
9347 OPERAND_TYPE_IMM32_32S_DISP32 },
9348 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
9349 BFD_RELOC_X86_64_TPOFF32 },
9350 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9351 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
9352 _dummy_first_bfd_reloc_code_real },
9353 OPERAND_TYPE_NONE },
9354 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
9355 BFD_RELOC_X86_64_DTPOFF32 },
9356 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9357 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
9358 _dummy_first_bfd_reloc_code_real },
9359 OPERAND_TYPE_NONE },
9360 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
9361 _dummy_first_bfd_reloc_code_real },
9362 OPERAND_TYPE_NONE },
9363 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
9364 BFD_RELOC_X86_64_GOT32 },
9365 OPERAND_TYPE_IMM32_32S_64_DISP32 },
9366 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
9367 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
9368 OPERAND_TYPE_IMM32_32S_DISP32 },
9369 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
9370 BFD_RELOC_X86_64_TLSDESC_CALL },
9371 OPERAND_TYPE_IMM32_32S_DISP32 },
9372 };
9373 char *cp;
9374 unsigned int j;
9375
9376 #if defined (OBJ_MAYBE_ELF)
9377 if (!IS_ELF)
9378 return NULL;
9379 #endif
9380
9381 for (cp = input_line_pointer; *cp != '@'; cp++)
9382 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9383 return NULL;
9384
9385 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9386 {
9387 int len = gotrel[j].len;
9388 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9389 {
9390 if (gotrel[j].rel[object_64bit] != 0)
9391 {
9392 int first, second;
9393 char *tmpbuf, *past_reloc;
9394
9395 *rel = gotrel[j].rel[object_64bit];
9396
9397 if (types)
9398 {
9399 if (flag_code != CODE_64BIT)
9400 {
9401 types->bitfield.imm32 = 1;
9402 types->bitfield.disp32 = 1;
9403 }
9404 else
9405 *types = gotrel[j].types64;
9406 }
9407
9408 if (j != 0 && GOT_symbol == NULL)
9409 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
9410
9411 /* The length of the first part of our input line. */
9412 first = cp - input_line_pointer;
9413
9414 /* The second part goes from after the reloc token until
9415 (and including) an end_of_line char or comma. */
9416 past_reloc = cp + 1 + len;
9417 cp = past_reloc;
9418 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9419 ++cp;
9420 second = cp + 1 - past_reloc;
9421
9422 /* Allocate and copy string. The trailing NUL shouldn't
9423 be necessary, but be safe. */
9424 tmpbuf = XNEWVEC (char, first + second + 2);
9425 memcpy (tmpbuf, input_line_pointer, first);
9426 if (second != 0 && *past_reloc != ' ')
9427 /* Replace the relocation token with ' ', so that
9428 errors like foo@GOTOFF1 will be detected. */
9429 tmpbuf[first++] = ' ';
9430 else
9431 /* Increment length by 1 if the relocation token is
9432 removed. */
9433 len++;
9434 if (adjust)
9435 *adjust = len;
9436 memcpy (tmpbuf + first, past_reloc, second);
9437 tmpbuf[first + second] = '\0';
9438 return tmpbuf;
9439 }
9440
9441 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9442 gotrel[j].str, 1 << (5 + object_64bit));
9443 return NULL;
9444 }
9445 }
9446
9447 /* Might be a symbol version string. Don't as_bad here. */
9448 return NULL;
9449 }
9450 #endif
9451
9452 #ifdef TE_PE
9453 #ifdef lex_got
9454 #undef lex_got
9455 #endif
9456 /* Parse operands of the form
9457 <symbol>@SECREL32+<nnn>
9458
9459 If we find one, set up the correct relocation in RELOC and copy the
9460 input string, minus the `@SECREL32' into a malloc'd buffer for
9461 parsing by the calling routine. Return this buffer, and if ADJUST
9462 is non-null set it to the length of the string we removed from the
9463 input line. Otherwise return NULL.
9464
9465 This function is copied from the ELF version above adjusted for PE targets. */
9466
9467 static char *
9468 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
9469 int *adjust ATTRIBUTE_UNUSED,
9470 i386_operand_type *types)
9471 {
9472 static const struct
9473 {
9474 const char *str;
9475 int len;
9476 const enum bfd_reloc_code_real rel[2];
9477 const i386_operand_type types64;
9478 }
9479 gotrel[] =
9480 {
9481 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
9482 BFD_RELOC_32_SECREL },
9483 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9484 };
9485
9486 char *cp;
9487 unsigned j;
9488
9489 for (cp = input_line_pointer; *cp != '@'; cp++)
9490 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9491 return NULL;
9492
9493 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9494 {
9495 int len = gotrel[j].len;
9496
9497 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9498 {
9499 if (gotrel[j].rel[object_64bit] != 0)
9500 {
9501 int first, second;
9502 char *tmpbuf, *past_reloc;
9503
9504 *rel = gotrel[j].rel[object_64bit];
9505 if (adjust)
9506 *adjust = len;
9507
9508 if (types)
9509 {
9510 if (flag_code != CODE_64BIT)
9511 {
9512 types->bitfield.imm32 = 1;
9513 types->bitfield.disp32 = 1;
9514 }
9515 else
9516 *types = gotrel[j].types64;
9517 }
9518
9519 /* The length of the first part of our input line. */
9520 first = cp - input_line_pointer;
9521
9522 /* The second part goes from after the reloc token until
9523 (and including) an end_of_line char or comma. */
9524 past_reloc = cp + 1 + len;
9525 cp = past_reloc;
9526 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9527 ++cp;
9528 second = cp + 1 - past_reloc;
9529
9530 /* Allocate and copy string. The trailing NUL shouldn't
9531 be necessary, but be safe. */
9532 tmpbuf = XNEWVEC (char, first + second + 2);
9533 memcpy (tmpbuf, input_line_pointer, first);
9534 if (second != 0 && *past_reloc != ' ')
9535 /* Replace the relocation token with ' ', so that
9536 errors like foo@SECLREL321 will be detected. */
9537 tmpbuf[first++] = ' ';
9538 memcpy (tmpbuf + first, past_reloc, second);
9539 tmpbuf[first + second] = '\0';
9540 return tmpbuf;
9541 }
9542
9543 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9544 gotrel[j].str, 1 << (5 + object_64bit));
9545 return NULL;
9546 }
9547 }
9548
9549 /* Might be a symbol version string. Don't as_bad here. */
9550 return NULL;
9551 }
9552
9553 #endif /* TE_PE */
9554
9555 bfd_reloc_code_real_type
9556 x86_cons (expressionS *exp, int size)
9557 {
9558 bfd_reloc_code_real_type got_reloc = NO_RELOC;
9559
9560 intel_syntax = -intel_syntax;
9561
9562 exp->X_md = 0;
9563 if (size == 4 || (object_64bit && size == 8))
9564 {
9565 /* Handle @GOTOFF and the like in an expression. */
9566 char *save;
9567 char *gotfree_input_line;
9568 int adjust = 0;
9569
9570 save = input_line_pointer;
9571 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9572 if (gotfree_input_line)
9573 input_line_pointer = gotfree_input_line;
9574
9575 expression (exp);
9576
9577 if (gotfree_input_line)
9578 {
9579 /* expression () has merrily parsed up to the end of line,
9580 or a comma - in the wrong buffer. Transfer how far
9581 input_line_pointer has moved to the right buffer. */
9582 input_line_pointer = (save
9583 + (input_line_pointer - gotfree_input_line)
9584 + adjust);
9585 free (gotfree_input_line);
9586 if (exp->X_op == O_constant
9587 || exp->X_op == O_absent
9588 || exp->X_op == O_illegal
9589 || exp->X_op == O_register
9590 || exp->X_op == O_big)
9591 {
9592 char c = *input_line_pointer;
9593 *input_line_pointer = 0;
9594 as_bad (_("missing or invalid expression `%s'"), save);
9595 *input_line_pointer = c;
9596 }
9597 else if ((got_reloc == BFD_RELOC_386_PLT32
9598 || got_reloc == BFD_RELOC_X86_64_PLT32)
9599 && exp->X_op != O_symbol)
9600 {
9601 char c = *input_line_pointer;
9602 *input_line_pointer = 0;
9603 as_bad (_("invalid PLT expression `%s'"), save);
9604 *input_line_pointer = c;
9605 }
9606 }
9607 }
9608 else
9609 expression (exp);
9610
9611 intel_syntax = -intel_syntax;
9612
9613 if (intel_syntax)
9614 i386_intel_simplify (exp);
9615
9616 return got_reloc;
9617 }
9618
9619 static void
9620 signed_cons (int size)
9621 {
9622 if (flag_code == CODE_64BIT)
9623 cons_sign = 1;
9624 cons (size);
9625 cons_sign = -1;
9626 }
9627
9628 #ifdef TE_PE
9629 static void
9630 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9631 {
9632 expressionS exp;
9633
9634 do
9635 {
9636 expression (&exp);
9637 if (exp.X_op == O_symbol)
9638 exp.X_op = O_secrel;
9639
9640 emit_expr (&exp, 4);
9641 }
9642 while (*input_line_pointer++ == ',');
9643
9644 input_line_pointer--;
9645 demand_empty_rest_of_line ();
9646 }
9647 #endif
9648
9649 /* Handle Vector operations. */
9650
9651 static char *
9652 check_VecOperations (char *op_string, char *op_end)
9653 {
9654 const reg_entry *mask;
9655 const char *saved;
9656 char *end_op;
9657
9658 while (*op_string
9659 && (op_end == NULL || op_string < op_end))
9660 {
9661 saved = op_string;
9662 if (*op_string == '{')
9663 {
9664 op_string++;
9665
9666 /* Check broadcasts. */
9667 if (strncmp (op_string, "1to", 3) == 0)
9668 {
9669 int bcst_type;
9670
9671 if (i.broadcast)
9672 goto duplicated_vec_op;
9673
9674 op_string += 3;
9675 if (*op_string == '8')
9676 bcst_type = 8;
9677 else if (*op_string == '4')
9678 bcst_type = 4;
9679 else if (*op_string == '2')
9680 bcst_type = 2;
9681 else if (*op_string == '1'
9682 && *(op_string+1) == '6')
9683 {
9684 bcst_type = 16;
9685 op_string++;
9686 }
9687 else
9688 {
9689 as_bad (_("Unsupported broadcast: `%s'"), saved);
9690 return NULL;
9691 }
9692 op_string++;
9693
9694 broadcast_op.type = bcst_type;
9695 broadcast_op.operand = this_operand;
9696 broadcast_op.bytes = 0;
9697 i.broadcast = &broadcast_op;
9698 }
9699 /* Check masking operation. */
9700 else if ((mask = parse_register (op_string, &end_op)) != NULL)
9701 {
9702 /* k0 can't be used for write mask. */
9703 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9704 {
9705 as_bad (_("`%s%s' can't be used for write mask"),
9706 register_prefix, mask->reg_name);
9707 return NULL;
9708 }
9709
9710 if (!i.mask)
9711 {
9712 mask_op.mask = mask;
9713 mask_op.zeroing = 0;
9714 mask_op.operand = this_operand;
9715 i.mask = &mask_op;
9716 }
9717 else
9718 {
9719 if (i.mask->mask)
9720 goto duplicated_vec_op;
9721
9722 i.mask->mask = mask;
9723
9724 /* Only "{z}" is allowed here. No need to check
9725 zeroing mask explicitly. */
9726 if (i.mask->operand != this_operand)
9727 {
9728 as_bad (_("invalid write mask `%s'"), saved);
9729 return NULL;
9730 }
9731 }
9732
9733 op_string = end_op;
9734 }
9735 /* Check zeroing-flag for masking operation. */
9736 else if (*op_string == 'z')
9737 {
9738 if (!i.mask)
9739 {
9740 mask_op.mask = NULL;
9741 mask_op.zeroing = 1;
9742 mask_op.operand = this_operand;
9743 i.mask = &mask_op;
9744 }
9745 else
9746 {
9747 if (i.mask->zeroing)
9748 {
9749 duplicated_vec_op:
9750 as_bad (_("duplicated `%s'"), saved);
9751 return NULL;
9752 }
9753
9754 i.mask->zeroing = 1;
9755
9756 /* Only "{%k}" is allowed here. No need to check mask
9757 register explicitly. */
9758 if (i.mask->operand != this_operand)
9759 {
9760 as_bad (_("invalid zeroing-masking `%s'"),
9761 saved);
9762 return NULL;
9763 }
9764 }
9765
9766 op_string++;
9767 }
9768 else
9769 goto unknown_vec_op;
9770
9771 if (*op_string != '}')
9772 {
9773 as_bad (_("missing `}' in `%s'"), saved);
9774 return NULL;
9775 }
9776 op_string++;
9777
9778 /* Strip whitespace since the addition of pseudo prefixes
9779 changed how the scrubber treats '{'. */
9780 if (is_space_char (*op_string))
9781 ++op_string;
9782
9783 continue;
9784 }
9785 unknown_vec_op:
9786 /* We don't know this one. */
9787 as_bad (_("unknown vector operation: `%s'"), saved);
9788 return NULL;
9789 }
9790
9791 if (i.mask && i.mask->zeroing && !i.mask->mask)
9792 {
9793 as_bad (_("zeroing-masking only allowed with write mask"));
9794 return NULL;
9795 }
9796
9797 return op_string;
9798 }
9799
9800 static int
9801 i386_immediate (char *imm_start)
9802 {
9803 char *save_input_line_pointer;
9804 char *gotfree_input_line;
9805 segT exp_seg = 0;
9806 expressionS *exp;
9807 i386_operand_type types;
9808
9809 operand_type_set (&types, ~0);
9810
9811 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9812 {
9813 as_bad (_("at most %d immediate operands are allowed"),
9814 MAX_IMMEDIATE_OPERANDS);
9815 return 0;
9816 }
9817
9818 exp = &im_expressions[i.imm_operands++];
9819 i.op[this_operand].imms = exp;
9820
9821 if (is_space_char (*imm_start))
9822 ++imm_start;
9823
9824 save_input_line_pointer = input_line_pointer;
9825 input_line_pointer = imm_start;
9826
9827 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9828 if (gotfree_input_line)
9829 input_line_pointer = gotfree_input_line;
9830
9831 exp_seg = expression (exp);
9832
9833 SKIP_WHITESPACE ();
9834
9835 /* Handle vector operations. */
9836 if (*input_line_pointer == '{')
9837 {
9838 input_line_pointer = check_VecOperations (input_line_pointer,
9839 NULL);
9840 if (input_line_pointer == NULL)
9841 return 0;
9842 }
9843
9844 if (*input_line_pointer)
9845 as_bad (_("junk `%s' after expression"), input_line_pointer);
9846
9847 input_line_pointer = save_input_line_pointer;
9848 if (gotfree_input_line)
9849 {
9850 free (gotfree_input_line);
9851
9852 if (exp->X_op == O_constant || exp->X_op == O_register)
9853 exp->X_op = O_illegal;
9854 }
9855
9856 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9857 }
9858
9859 static int
9860 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9861 i386_operand_type types, const char *imm_start)
9862 {
9863 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9864 {
9865 if (imm_start)
9866 as_bad (_("missing or invalid immediate expression `%s'"),
9867 imm_start);
9868 return 0;
9869 }
9870 else if (exp->X_op == O_constant)
9871 {
9872 /* Size it properly later. */
9873 i.types[this_operand].bitfield.imm64 = 1;
9874 /* If not 64bit, sign extend val. */
9875 if (flag_code != CODE_64BIT
9876 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9877 exp->X_add_number
9878 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9879 }
9880 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9881 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9882 && exp_seg != absolute_section
9883 && exp_seg != text_section
9884 && exp_seg != data_section
9885 && exp_seg != bss_section
9886 && exp_seg != undefined_section
9887 && !bfd_is_com_section (exp_seg))
9888 {
9889 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9890 return 0;
9891 }
9892 #endif
9893 else if (!intel_syntax && exp_seg == reg_section)
9894 {
9895 if (imm_start)
9896 as_bad (_("illegal immediate register operand %s"), imm_start);
9897 return 0;
9898 }
9899 else
9900 {
9901 /* This is an address. The size of the address will be
9902 determined later, depending on destination register,
9903 suffix, or the default for the section. */
9904 i.types[this_operand].bitfield.imm8 = 1;
9905 i.types[this_operand].bitfield.imm16 = 1;
9906 i.types[this_operand].bitfield.imm32 = 1;
9907 i.types[this_operand].bitfield.imm32s = 1;
9908 i.types[this_operand].bitfield.imm64 = 1;
9909 i.types[this_operand] = operand_type_and (i.types[this_operand],
9910 types);
9911 }
9912
9913 return 1;
9914 }
9915
9916 static char *
9917 i386_scale (char *scale)
9918 {
9919 offsetT val;
9920 char *save = input_line_pointer;
9921
9922 input_line_pointer = scale;
9923 val = get_absolute_expression ();
9924
9925 switch (val)
9926 {
9927 case 1:
9928 i.log2_scale_factor = 0;
9929 break;
9930 case 2:
9931 i.log2_scale_factor = 1;
9932 break;
9933 case 4:
9934 i.log2_scale_factor = 2;
9935 break;
9936 case 8:
9937 i.log2_scale_factor = 3;
9938 break;
9939 default:
9940 {
9941 char sep = *input_line_pointer;
9942
9943 *input_line_pointer = '\0';
9944 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9945 scale);
9946 *input_line_pointer = sep;
9947 input_line_pointer = save;
9948 return NULL;
9949 }
9950 }
9951 if (i.log2_scale_factor != 0 && i.index_reg == 0)
9952 {
9953 as_warn (_("scale factor of %d without an index register"),
9954 1 << i.log2_scale_factor);
9955 i.log2_scale_factor = 0;
9956 }
9957 scale = input_line_pointer;
9958 input_line_pointer = save;
9959 return scale;
9960 }
9961
9962 static int
9963 i386_displacement (char *disp_start, char *disp_end)
9964 {
9965 expressionS *exp;
9966 segT exp_seg = 0;
9967 char *save_input_line_pointer;
9968 char *gotfree_input_line;
9969 int override;
9970 i386_operand_type bigdisp, types = anydisp;
9971 int ret;
9972
9973 if (i.disp_operands == MAX_MEMORY_OPERANDS)
9974 {
9975 as_bad (_("at most %d displacement operands are allowed"),
9976 MAX_MEMORY_OPERANDS);
9977 return 0;
9978 }
9979
9980 operand_type_set (&bigdisp, 0);
9981 if (i.jumpabsolute
9982 || i.types[this_operand].bitfield.baseindex
9983 || (current_templates->start->opcode_modifier.jump != JUMP
9984 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
9985 {
9986 i386_addressing_mode ();
9987 override = (i.prefix[ADDR_PREFIX] != 0);
9988 if (flag_code == CODE_64BIT)
9989 {
9990 if (!override)
9991 {
9992 bigdisp.bitfield.disp32s = 1;
9993 bigdisp.bitfield.disp64 = 1;
9994 }
9995 else
9996 bigdisp.bitfield.disp32 = 1;
9997 }
9998 else if ((flag_code == CODE_16BIT) ^ override)
9999 bigdisp.bitfield.disp16 = 1;
10000 else
10001 bigdisp.bitfield.disp32 = 1;
10002 }
10003 else
10004 {
10005 /* For PC-relative branches, the width of the displacement may be
10006 dependent upon data size, but is never dependent upon address size.
10007 Also make sure to not unintentionally match against a non-PC-relative
10008 branch template. */
10009 static templates aux_templates;
10010 const insn_template *t = current_templates->start;
10011 bfd_boolean has_intel64 = FALSE;
10012
10013 aux_templates.start = t;
10014 while (++t < current_templates->end)
10015 {
10016 if (t->opcode_modifier.jump
10017 != current_templates->start->opcode_modifier.jump)
10018 break;
10019 if ((t->opcode_modifier.isa64 >= INTEL64))
10020 has_intel64 = TRUE;
10021 }
10022 if (t < current_templates->end)
10023 {
10024 aux_templates.end = t;
10025 current_templates = &aux_templates;
10026 }
10027
10028 override = (i.prefix[DATA_PREFIX] != 0);
10029 if (flag_code == CODE_64BIT)
10030 {
10031 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10032 && (!intel64 || !has_intel64))
10033 bigdisp.bitfield.disp16 = 1;
10034 else
10035 bigdisp.bitfield.disp32s = 1;
10036 }
10037 else
10038 {
10039 if (!override)
10040 override = (i.suffix == (flag_code != CODE_16BIT
10041 ? WORD_MNEM_SUFFIX
10042 : LONG_MNEM_SUFFIX));
10043 bigdisp.bitfield.disp32 = 1;
10044 if ((flag_code == CODE_16BIT) ^ override)
10045 {
10046 bigdisp.bitfield.disp32 = 0;
10047 bigdisp.bitfield.disp16 = 1;
10048 }
10049 }
10050 }
10051 i.types[this_operand] = operand_type_or (i.types[this_operand],
10052 bigdisp);
10053
10054 exp = &disp_expressions[i.disp_operands];
10055 i.op[this_operand].disps = exp;
10056 i.disp_operands++;
10057 save_input_line_pointer = input_line_pointer;
10058 input_line_pointer = disp_start;
10059 END_STRING_AND_SAVE (disp_end);
10060
10061 #ifndef GCC_ASM_O_HACK
10062 #define GCC_ASM_O_HACK 0
10063 #endif
10064 #if GCC_ASM_O_HACK
10065 END_STRING_AND_SAVE (disp_end + 1);
10066 if (i.types[this_operand].bitfield.baseIndex
10067 && displacement_string_end[-1] == '+')
10068 {
10069 /* This hack is to avoid a warning when using the "o"
10070 constraint within gcc asm statements.
10071 For instance:
10072
10073 #define _set_tssldt_desc(n,addr,limit,type) \
10074 __asm__ __volatile__ ( \
10075 "movw %w2,%0\n\t" \
10076 "movw %w1,2+%0\n\t" \
10077 "rorl $16,%1\n\t" \
10078 "movb %b1,4+%0\n\t" \
10079 "movb %4,5+%0\n\t" \
10080 "movb $0,6+%0\n\t" \
10081 "movb %h1,7+%0\n\t" \
10082 "rorl $16,%1" \
10083 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10084
10085 This works great except that the output assembler ends
10086 up looking a bit weird if it turns out that there is
10087 no offset. You end up producing code that looks like:
10088
10089 #APP
10090 movw $235,(%eax)
10091 movw %dx,2+(%eax)
10092 rorl $16,%edx
10093 movb %dl,4+(%eax)
10094 movb $137,5+(%eax)
10095 movb $0,6+(%eax)
10096 movb %dh,7+(%eax)
10097 rorl $16,%edx
10098 #NO_APP
10099
10100 So here we provide the missing zero. */
10101
10102 *displacement_string_end = '0';
10103 }
10104 #endif
10105 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10106 if (gotfree_input_line)
10107 input_line_pointer = gotfree_input_line;
10108
10109 exp_seg = expression (exp);
10110
10111 SKIP_WHITESPACE ();
10112 if (*input_line_pointer)
10113 as_bad (_("junk `%s' after expression"), input_line_pointer);
10114 #if GCC_ASM_O_HACK
10115 RESTORE_END_STRING (disp_end + 1);
10116 #endif
10117 input_line_pointer = save_input_line_pointer;
10118 if (gotfree_input_line)
10119 {
10120 free (gotfree_input_line);
10121
10122 if (exp->X_op == O_constant || exp->X_op == O_register)
10123 exp->X_op = O_illegal;
10124 }
10125
10126 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10127
10128 RESTORE_END_STRING (disp_end);
10129
10130 return ret;
10131 }
10132
10133 static int
10134 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10135 i386_operand_type types, const char *disp_start)
10136 {
10137 i386_operand_type bigdisp;
10138 int ret = 1;
10139
10140 /* We do this to make sure that the section symbol is in
10141 the symbol table. We will ultimately change the relocation
10142 to be relative to the beginning of the section. */
10143 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10144 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10145 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10146 {
10147 if (exp->X_op != O_symbol)
10148 goto inv_disp;
10149
10150 if (S_IS_LOCAL (exp->X_add_symbol)
10151 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10152 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10153 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10154 exp->X_op = O_subtract;
10155 exp->X_op_symbol = GOT_symbol;
10156 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10157 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10158 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10159 i.reloc[this_operand] = BFD_RELOC_64;
10160 else
10161 i.reloc[this_operand] = BFD_RELOC_32;
10162 }
10163
10164 else if (exp->X_op == O_absent
10165 || exp->X_op == O_illegal
10166 || exp->X_op == O_big)
10167 {
10168 inv_disp:
10169 as_bad (_("missing or invalid displacement expression `%s'"),
10170 disp_start);
10171 ret = 0;
10172 }
10173
10174 else if (flag_code == CODE_64BIT
10175 && !i.prefix[ADDR_PREFIX]
10176 && exp->X_op == O_constant)
10177 {
10178 /* Since displacement is signed extended to 64bit, don't allow
10179 disp32 and turn off disp32s if they are out of range. */
10180 i.types[this_operand].bitfield.disp32 = 0;
10181 if (!fits_in_signed_long (exp->X_add_number))
10182 {
10183 i.types[this_operand].bitfield.disp32s = 0;
10184 if (i.types[this_operand].bitfield.baseindex)
10185 {
10186 as_bad (_("0x%lx out range of signed 32bit displacement"),
10187 (long) exp->X_add_number);
10188 ret = 0;
10189 }
10190 }
10191 }
10192
10193 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10194 else if (exp->X_op != O_constant
10195 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10196 && exp_seg != absolute_section
10197 && exp_seg != text_section
10198 && exp_seg != data_section
10199 && exp_seg != bss_section
10200 && exp_seg != undefined_section
10201 && !bfd_is_com_section (exp_seg))
10202 {
10203 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10204 ret = 0;
10205 }
10206 #endif
10207
10208 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10209 /* Constants get taken care of by optimize_disp(). */
10210 && exp->X_op != O_constant)
10211 i.types[this_operand].bitfield.disp8 = 1;
10212
10213 /* Check if this is a displacement only operand. */
10214 bigdisp = i.types[this_operand];
10215 bigdisp.bitfield.disp8 = 0;
10216 bigdisp.bitfield.disp16 = 0;
10217 bigdisp.bitfield.disp32 = 0;
10218 bigdisp.bitfield.disp32s = 0;
10219 bigdisp.bitfield.disp64 = 0;
10220 if (operand_type_all_zero (&bigdisp))
10221 i.types[this_operand] = operand_type_and (i.types[this_operand],
10222 types);
10223
10224 return ret;
10225 }
10226
10227 /* Return the active addressing mode, taking address override and
10228 registers forming the address into consideration. Update the
10229 address override prefix if necessary. */
10230
10231 static enum flag_code
10232 i386_addressing_mode (void)
10233 {
10234 enum flag_code addr_mode;
10235
10236 if (i.prefix[ADDR_PREFIX])
10237 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10238 else
10239 {
10240 addr_mode = flag_code;
10241
10242 #if INFER_ADDR_PREFIX
10243 if (i.mem_operands == 0)
10244 {
10245 /* Infer address prefix from the first memory operand. */
10246 const reg_entry *addr_reg = i.base_reg;
10247
10248 if (addr_reg == NULL)
10249 addr_reg = i.index_reg;
10250
10251 if (addr_reg)
10252 {
10253 if (addr_reg->reg_type.bitfield.dword)
10254 addr_mode = CODE_32BIT;
10255 else if (flag_code != CODE_64BIT
10256 && addr_reg->reg_type.bitfield.word)
10257 addr_mode = CODE_16BIT;
10258
10259 if (addr_mode != flag_code)
10260 {
10261 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10262 i.prefixes += 1;
10263 /* Change the size of any displacement too. At most one
10264 of Disp16 or Disp32 is set.
10265 FIXME. There doesn't seem to be any real need for
10266 separate Disp16 and Disp32 flags. The same goes for
10267 Imm16 and Imm32. Removing them would probably clean
10268 up the code quite a lot. */
10269 if (flag_code != CODE_64BIT
10270 && (i.types[this_operand].bitfield.disp16
10271 || i.types[this_operand].bitfield.disp32))
10272 i.types[this_operand]
10273 = operand_type_xor (i.types[this_operand], disp16_32);
10274 }
10275 }
10276 }
10277 #endif
10278 }
10279
10280 return addr_mode;
10281 }
10282
10283 /* Make sure the memory operand we've been dealt is valid.
10284 Return 1 on success, 0 on a failure. */
10285
10286 static int
10287 i386_index_check (const char *operand_string)
10288 {
10289 const char *kind = "base/index";
10290 enum flag_code addr_mode = i386_addressing_mode ();
10291
10292 if (current_templates->start->opcode_modifier.isstring
10293 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10294 && (current_templates->end[-1].opcode_modifier.isstring
10295 || i.mem_operands))
10296 {
10297 /* Memory operands of string insns are special in that they only allow
10298 a single register (rDI, rSI, or rBX) as their memory address. */
10299 const reg_entry *expected_reg;
10300 static const char *di_si[][2] =
10301 {
10302 { "esi", "edi" },
10303 { "si", "di" },
10304 { "rsi", "rdi" }
10305 };
10306 static const char *bx[] = { "ebx", "bx", "rbx" };
10307
10308 kind = "string address";
10309
10310 if (current_templates->start->opcode_modifier.repprefixok)
10311 {
10312 int es_op = current_templates->end[-1].opcode_modifier.isstring
10313 - IS_STRING_ES_OP0;
10314 int op = 0;
10315
10316 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
10317 || ((!i.mem_operands != !intel_syntax)
10318 && current_templates->end[-1].operand_types[1]
10319 .bitfield.baseindex))
10320 op = 1;
10321 expected_reg = hash_find (reg_hash, di_si[addr_mode][op == es_op]);
10322 }
10323 else
10324 expected_reg = hash_find (reg_hash, bx[addr_mode]);
10325
10326 if (i.base_reg != expected_reg
10327 || i.index_reg
10328 || operand_type_check (i.types[this_operand], disp))
10329 {
10330 /* The second memory operand must have the same size as
10331 the first one. */
10332 if (i.mem_operands
10333 && i.base_reg
10334 && !((addr_mode == CODE_64BIT
10335 && i.base_reg->reg_type.bitfield.qword)
10336 || (addr_mode == CODE_32BIT
10337 ? i.base_reg->reg_type.bitfield.dword
10338 : i.base_reg->reg_type.bitfield.word)))
10339 goto bad_address;
10340
10341 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
10342 operand_string,
10343 intel_syntax ? '[' : '(',
10344 register_prefix,
10345 expected_reg->reg_name,
10346 intel_syntax ? ']' : ')');
10347 return 1;
10348 }
10349 else
10350 return 1;
10351
10352 bad_address:
10353 as_bad (_("`%s' is not a valid %s expression"),
10354 operand_string, kind);
10355 return 0;
10356 }
10357 else
10358 {
10359 if (addr_mode != CODE_16BIT)
10360 {
10361 /* 32-bit/64-bit checks. */
10362 if ((i.base_reg
10363 && ((addr_mode == CODE_64BIT
10364 ? !i.base_reg->reg_type.bitfield.qword
10365 : !i.base_reg->reg_type.bitfield.dword)
10366 || (i.index_reg && i.base_reg->reg_num == RegIP)
10367 || i.base_reg->reg_num == RegIZ))
10368 || (i.index_reg
10369 && !i.index_reg->reg_type.bitfield.xmmword
10370 && !i.index_reg->reg_type.bitfield.ymmword
10371 && !i.index_reg->reg_type.bitfield.zmmword
10372 && ((addr_mode == CODE_64BIT
10373 ? !i.index_reg->reg_type.bitfield.qword
10374 : !i.index_reg->reg_type.bitfield.dword)
10375 || !i.index_reg->reg_type.bitfield.baseindex)))
10376 goto bad_address;
10377
10378 /* bndmk, bndldx, and bndstx have special restrictions. */
10379 if (current_templates->start->base_opcode == 0xf30f1b
10380 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
10381 {
10382 /* They cannot use RIP-relative addressing. */
10383 if (i.base_reg && i.base_reg->reg_num == RegIP)
10384 {
10385 as_bad (_("`%s' cannot be used here"), operand_string);
10386 return 0;
10387 }
10388
10389 /* bndldx and bndstx ignore their scale factor. */
10390 if (current_templates->start->base_opcode != 0xf30f1b
10391 && i.log2_scale_factor)
10392 as_warn (_("register scaling is being ignored here"));
10393 }
10394 }
10395 else
10396 {
10397 /* 16-bit checks. */
10398 if ((i.base_reg
10399 && (!i.base_reg->reg_type.bitfield.word
10400 || !i.base_reg->reg_type.bitfield.baseindex))
10401 || (i.index_reg
10402 && (!i.index_reg->reg_type.bitfield.word
10403 || !i.index_reg->reg_type.bitfield.baseindex
10404 || !(i.base_reg
10405 && i.base_reg->reg_num < 6
10406 && i.index_reg->reg_num >= 6
10407 && i.log2_scale_factor == 0))))
10408 goto bad_address;
10409 }
10410 }
10411 return 1;
10412 }
10413
10414 /* Handle vector immediates. */
10415
10416 static int
10417 RC_SAE_immediate (const char *imm_start)
10418 {
10419 unsigned int match_found, j;
10420 const char *pstr = imm_start;
10421 expressionS *exp;
10422
10423 if (*pstr != '{')
10424 return 0;
10425
10426 pstr++;
10427 match_found = 0;
10428 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
10429 {
10430 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
10431 {
10432 if (!i.rounding)
10433 {
10434 rc_op.type = RC_NamesTable[j].type;
10435 rc_op.operand = this_operand;
10436 i.rounding = &rc_op;
10437 }
10438 else
10439 {
10440 as_bad (_("duplicated `%s'"), imm_start);
10441 return 0;
10442 }
10443 pstr += RC_NamesTable[j].len;
10444 match_found = 1;
10445 break;
10446 }
10447 }
10448 if (!match_found)
10449 return 0;
10450
10451 if (*pstr++ != '}')
10452 {
10453 as_bad (_("Missing '}': '%s'"), imm_start);
10454 return 0;
10455 }
10456 /* RC/SAE immediate string should contain nothing more. */;
10457 if (*pstr != 0)
10458 {
10459 as_bad (_("Junk after '}': '%s'"), imm_start);
10460 return 0;
10461 }
10462
10463 exp = &im_expressions[i.imm_operands++];
10464 i.op[this_operand].imms = exp;
10465
10466 exp->X_op = O_constant;
10467 exp->X_add_number = 0;
10468 exp->X_add_symbol = (symbolS *) 0;
10469 exp->X_op_symbol = (symbolS *) 0;
10470
10471 i.types[this_operand].bitfield.imm8 = 1;
10472 return 1;
10473 }
10474
10475 /* Only string instructions can have a second memory operand, so
10476 reduce current_templates to just those if it contains any. */
10477 static int
10478 maybe_adjust_templates (void)
10479 {
10480 const insn_template *t;
10481
10482 gas_assert (i.mem_operands == 1);
10483
10484 for (t = current_templates->start; t < current_templates->end; ++t)
10485 if (t->opcode_modifier.isstring)
10486 break;
10487
10488 if (t < current_templates->end)
10489 {
10490 static templates aux_templates;
10491 bfd_boolean recheck;
10492
10493 aux_templates.start = t;
10494 for (; t < current_templates->end; ++t)
10495 if (!t->opcode_modifier.isstring)
10496 break;
10497 aux_templates.end = t;
10498
10499 /* Determine whether to re-check the first memory operand. */
10500 recheck = (aux_templates.start != current_templates->start
10501 || t != current_templates->end);
10502
10503 current_templates = &aux_templates;
10504
10505 if (recheck)
10506 {
10507 i.mem_operands = 0;
10508 if (i.memop1_string != NULL
10509 && i386_index_check (i.memop1_string) == 0)
10510 return 0;
10511 i.mem_operands = 1;
10512 }
10513 }
10514
10515 return 1;
10516 }
10517
10518 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
10519 on error. */
10520
10521 static int
10522 i386_att_operand (char *operand_string)
10523 {
10524 const reg_entry *r;
10525 char *end_op;
10526 char *op_string = operand_string;
10527
10528 if (is_space_char (*op_string))
10529 ++op_string;
10530
10531 /* We check for an absolute prefix (differentiating,
10532 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
10533 if (*op_string == ABSOLUTE_PREFIX)
10534 {
10535 ++op_string;
10536 if (is_space_char (*op_string))
10537 ++op_string;
10538 i.jumpabsolute = TRUE;
10539 }
10540
10541 /* Check if operand is a register. */
10542 if ((r = parse_register (op_string, &end_op)) != NULL)
10543 {
10544 i386_operand_type temp;
10545
10546 /* Check for a segment override by searching for ':' after a
10547 segment register. */
10548 op_string = end_op;
10549 if (is_space_char (*op_string))
10550 ++op_string;
10551 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10552 {
10553 switch (r->reg_num)
10554 {
10555 case 0:
10556 i.seg[i.mem_operands] = &es;
10557 break;
10558 case 1:
10559 i.seg[i.mem_operands] = &cs;
10560 break;
10561 case 2:
10562 i.seg[i.mem_operands] = &ss;
10563 break;
10564 case 3:
10565 i.seg[i.mem_operands] = &ds;
10566 break;
10567 case 4:
10568 i.seg[i.mem_operands] = &fs;
10569 break;
10570 case 5:
10571 i.seg[i.mem_operands] = &gs;
10572 break;
10573 }
10574
10575 /* Skip the ':' and whitespace. */
10576 ++op_string;
10577 if (is_space_char (*op_string))
10578 ++op_string;
10579
10580 if (!is_digit_char (*op_string)
10581 && !is_identifier_char (*op_string)
10582 && *op_string != '('
10583 && *op_string != ABSOLUTE_PREFIX)
10584 {
10585 as_bad (_("bad memory operand `%s'"), op_string);
10586 return 0;
10587 }
10588 /* Handle case of %es:*foo. */
10589 if (*op_string == ABSOLUTE_PREFIX)
10590 {
10591 ++op_string;
10592 if (is_space_char (*op_string))
10593 ++op_string;
10594 i.jumpabsolute = TRUE;
10595 }
10596 goto do_memory_reference;
10597 }
10598
10599 /* Handle vector operations. */
10600 if (*op_string == '{')
10601 {
10602 op_string = check_VecOperations (op_string, NULL);
10603 if (op_string == NULL)
10604 return 0;
10605 }
10606
10607 if (*op_string)
10608 {
10609 as_bad (_("junk `%s' after register"), op_string);
10610 return 0;
10611 }
10612 temp = r->reg_type;
10613 temp.bitfield.baseindex = 0;
10614 i.types[this_operand] = operand_type_or (i.types[this_operand],
10615 temp);
10616 i.types[this_operand].bitfield.unspecified = 0;
10617 i.op[this_operand].regs = r;
10618 i.reg_operands++;
10619 }
10620 else if (*op_string == REGISTER_PREFIX)
10621 {
10622 as_bad (_("bad register name `%s'"), op_string);
10623 return 0;
10624 }
10625 else if (*op_string == IMMEDIATE_PREFIX)
10626 {
10627 ++op_string;
10628 if (i.jumpabsolute)
10629 {
10630 as_bad (_("immediate operand illegal with absolute jump"));
10631 return 0;
10632 }
10633 if (!i386_immediate (op_string))
10634 return 0;
10635 }
10636 else if (RC_SAE_immediate (operand_string))
10637 {
10638 /* If it is a RC or SAE immediate, do nothing. */
10639 ;
10640 }
10641 else if (is_digit_char (*op_string)
10642 || is_identifier_char (*op_string)
10643 || *op_string == '"'
10644 || *op_string == '(')
10645 {
10646 /* This is a memory reference of some sort. */
10647 char *base_string;
10648
10649 /* Start and end of displacement string expression (if found). */
10650 char *displacement_string_start;
10651 char *displacement_string_end;
10652 char *vop_start;
10653
10654 do_memory_reference:
10655 if (i.mem_operands == 1 && !maybe_adjust_templates ())
10656 return 0;
10657 if ((i.mem_operands == 1
10658 && !current_templates->start->opcode_modifier.isstring)
10659 || i.mem_operands == 2)
10660 {
10661 as_bad (_("too many memory references for `%s'"),
10662 current_templates->start->name);
10663 return 0;
10664 }
10665
10666 /* Check for base index form. We detect the base index form by
10667 looking for an ')' at the end of the operand, searching
10668 for the '(' matching it, and finding a REGISTER_PREFIX or ','
10669 after the '('. */
10670 base_string = op_string + strlen (op_string);
10671
10672 /* Handle vector operations. */
10673 vop_start = strchr (op_string, '{');
10674 if (vop_start && vop_start < base_string)
10675 {
10676 if (check_VecOperations (vop_start, base_string) == NULL)
10677 return 0;
10678 base_string = vop_start;
10679 }
10680
10681 --base_string;
10682 if (is_space_char (*base_string))
10683 --base_string;
10684
10685 /* If we only have a displacement, set-up for it to be parsed later. */
10686 displacement_string_start = op_string;
10687 displacement_string_end = base_string + 1;
10688
10689 if (*base_string == ')')
10690 {
10691 char *temp_string;
10692 unsigned int parens_balanced = 1;
10693 /* We've already checked that the number of left & right ()'s are
10694 equal, so this loop will not be infinite. */
10695 do
10696 {
10697 base_string--;
10698 if (*base_string == ')')
10699 parens_balanced++;
10700 if (*base_string == '(')
10701 parens_balanced--;
10702 }
10703 while (parens_balanced);
10704
10705 temp_string = base_string;
10706
10707 /* Skip past '(' and whitespace. */
10708 ++base_string;
10709 if (is_space_char (*base_string))
10710 ++base_string;
10711
10712 if (*base_string == ','
10713 || ((i.base_reg = parse_register (base_string, &end_op))
10714 != NULL))
10715 {
10716 displacement_string_end = temp_string;
10717
10718 i.types[this_operand].bitfield.baseindex = 1;
10719
10720 if (i.base_reg)
10721 {
10722 base_string = end_op;
10723 if (is_space_char (*base_string))
10724 ++base_string;
10725 }
10726
10727 /* There may be an index reg or scale factor here. */
10728 if (*base_string == ',')
10729 {
10730 ++base_string;
10731 if (is_space_char (*base_string))
10732 ++base_string;
10733
10734 if ((i.index_reg = parse_register (base_string, &end_op))
10735 != NULL)
10736 {
10737 base_string = end_op;
10738 if (is_space_char (*base_string))
10739 ++base_string;
10740 if (*base_string == ',')
10741 {
10742 ++base_string;
10743 if (is_space_char (*base_string))
10744 ++base_string;
10745 }
10746 else if (*base_string != ')')
10747 {
10748 as_bad (_("expecting `,' or `)' "
10749 "after index register in `%s'"),
10750 operand_string);
10751 return 0;
10752 }
10753 }
10754 else if (*base_string == REGISTER_PREFIX)
10755 {
10756 end_op = strchr (base_string, ',');
10757 if (end_op)
10758 *end_op = '\0';
10759 as_bad (_("bad register name `%s'"), base_string);
10760 return 0;
10761 }
10762
10763 /* Check for scale factor. */
10764 if (*base_string != ')')
10765 {
10766 char *end_scale = i386_scale (base_string);
10767
10768 if (!end_scale)
10769 return 0;
10770
10771 base_string = end_scale;
10772 if (is_space_char (*base_string))
10773 ++base_string;
10774 if (*base_string != ')')
10775 {
10776 as_bad (_("expecting `)' "
10777 "after scale factor in `%s'"),
10778 operand_string);
10779 return 0;
10780 }
10781 }
10782 else if (!i.index_reg)
10783 {
10784 as_bad (_("expecting index register or scale factor "
10785 "after `,'; got '%c'"),
10786 *base_string);
10787 return 0;
10788 }
10789 }
10790 else if (*base_string != ')')
10791 {
10792 as_bad (_("expecting `,' or `)' "
10793 "after base register in `%s'"),
10794 operand_string);
10795 return 0;
10796 }
10797 }
10798 else if (*base_string == REGISTER_PREFIX)
10799 {
10800 end_op = strchr (base_string, ',');
10801 if (end_op)
10802 *end_op = '\0';
10803 as_bad (_("bad register name `%s'"), base_string);
10804 return 0;
10805 }
10806 }
10807
10808 /* If there's an expression beginning the operand, parse it,
10809 assuming displacement_string_start and
10810 displacement_string_end are meaningful. */
10811 if (displacement_string_start != displacement_string_end)
10812 {
10813 if (!i386_displacement (displacement_string_start,
10814 displacement_string_end))
10815 return 0;
10816 }
10817
10818 /* Special case for (%dx) while doing input/output op. */
10819 if (i.base_reg
10820 && i.base_reg->reg_type.bitfield.instance == RegD
10821 && i.base_reg->reg_type.bitfield.word
10822 && i.index_reg == 0
10823 && i.log2_scale_factor == 0
10824 && i.seg[i.mem_operands] == 0
10825 && !operand_type_check (i.types[this_operand], disp))
10826 {
10827 i.types[this_operand] = i.base_reg->reg_type;
10828 return 1;
10829 }
10830
10831 if (i386_index_check (operand_string) == 0)
10832 return 0;
10833 i.flags[this_operand] |= Operand_Mem;
10834 if (i.mem_operands == 0)
10835 i.memop1_string = xstrdup (operand_string);
10836 i.mem_operands++;
10837 }
10838 else
10839 {
10840 /* It's not a memory operand; argh! */
10841 as_bad (_("invalid char %s beginning operand %d `%s'"),
10842 output_invalid (*op_string),
10843 this_operand + 1,
10844 op_string);
10845 return 0;
10846 }
10847 return 1; /* Normal return. */
10848 }
10849 \f
10850 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10851 that an rs_machine_dependent frag may reach. */
10852
10853 unsigned int
10854 i386_frag_max_var (fragS *frag)
10855 {
10856 /* The only relaxable frags are for jumps.
10857 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
10858 gas_assert (frag->fr_type == rs_machine_dependent);
10859 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10860 }
10861
10862 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10863 static int
10864 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10865 {
10866 /* STT_GNU_IFUNC symbol must go through PLT. */
10867 if ((symbol_get_bfdsym (fr_symbol)->flags
10868 & BSF_GNU_INDIRECT_FUNCTION) != 0)
10869 return 0;
10870
10871 if (!S_IS_EXTERNAL (fr_symbol))
10872 /* Symbol may be weak or local. */
10873 return !S_IS_WEAK (fr_symbol);
10874
10875 /* Global symbols with non-default visibility can't be preempted. */
10876 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10877 return 1;
10878
10879 if (fr_var != NO_RELOC)
10880 switch ((enum bfd_reloc_code_real) fr_var)
10881 {
10882 case BFD_RELOC_386_PLT32:
10883 case BFD_RELOC_X86_64_PLT32:
10884 /* Symbol with PLT relocation may be preempted. */
10885 return 0;
10886 default:
10887 abort ();
10888 }
10889
10890 /* Global symbols with default visibility in a shared library may be
10891 preempted by another definition. */
10892 return !shared;
10893 }
10894 #endif
10895
10896 /* Return the next non-empty frag. */
10897
10898 static fragS *
10899 i386_next_non_empty_frag (fragS *fragP)
10900 {
10901 /* There may be a frag with a ".fill 0" when there is no room in
10902 the current frag for frag_grow in output_insn. */
10903 for (fragP = fragP->fr_next;
10904 (fragP != NULL
10905 && fragP->fr_type == rs_fill
10906 && fragP->fr_fix == 0);
10907 fragP = fragP->fr_next)
10908 ;
10909 return fragP;
10910 }
10911
10912 /* Return the next jcc frag after BRANCH_PADDING. */
10913
10914 static fragS *
10915 i386_next_jcc_frag (fragS *fragP)
10916 {
10917 if (!fragP)
10918 return NULL;
10919
10920 if (fragP->fr_type == rs_machine_dependent
10921 && (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10922 == BRANCH_PADDING))
10923 {
10924 fragP = i386_next_non_empty_frag (fragP);
10925 if (fragP->fr_type != rs_machine_dependent)
10926 return NULL;
10927 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == COND_JUMP)
10928 return fragP;
10929 }
10930
10931 return NULL;
10932 }
10933
10934 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
10935
10936 static void
10937 i386_classify_machine_dependent_frag (fragS *fragP)
10938 {
10939 fragS *cmp_fragP;
10940 fragS *pad_fragP;
10941 fragS *branch_fragP;
10942 fragS *next_fragP;
10943 unsigned int max_prefix_length;
10944
10945 if (fragP->tc_frag_data.classified)
10946 return;
10947
10948 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
10949 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
10950 for (next_fragP = fragP;
10951 next_fragP != NULL;
10952 next_fragP = next_fragP->fr_next)
10953 {
10954 next_fragP->tc_frag_data.classified = 1;
10955 if (next_fragP->fr_type == rs_machine_dependent)
10956 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
10957 {
10958 case BRANCH_PADDING:
10959 /* The BRANCH_PADDING frag must be followed by a branch
10960 frag. */
10961 branch_fragP = i386_next_non_empty_frag (next_fragP);
10962 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10963 break;
10964 case FUSED_JCC_PADDING:
10965 /* Check if this is a fused jcc:
10966 FUSED_JCC_PADDING
10967 CMP like instruction
10968 BRANCH_PADDING
10969 COND_JUMP
10970 */
10971 cmp_fragP = i386_next_non_empty_frag (next_fragP);
10972 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
10973 branch_fragP = i386_next_jcc_frag (pad_fragP);
10974 if (branch_fragP)
10975 {
10976 /* The BRANCH_PADDING frag is merged with the
10977 FUSED_JCC_PADDING frag. */
10978 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
10979 /* CMP like instruction size. */
10980 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
10981 frag_wane (pad_fragP);
10982 /* Skip to branch_fragP. */
10983 next_fragP = branch_fragP;
10984 }
10985 else if (next_fragP->tc_frag_data.max_prefix_length)
10986 {
10987 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
10988 a fused jcc. */
10989 next_fragP->fr_subtype
10990 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
10991 next_fragP->tc_frag_data.max_bytes
10992 = next_fragP->tc_frag_data.max_prefix_length;
10993 /* This will be updated in the BRANCH_PREFIX scan. */
10994 next_fragP->tc_frag_data.max_prefix_length = 0;
10995 }
10996 else
10997 frag_wane (next_fragP);
10998 break;
10999 }
11000 }
11001
11002 /* Stop if there is no BRANCH_PREFIX. */
11003 if (!align_branch_prefix_size)
11004 return;
11005
11006 /* Scan for BRANCH_PREFIX. */
11007 for (; fragP != NULL; fragP = fragP->fr_next)
11008 {
11009 if (fragP->fr_type != rs_machine_dependent
11010 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11011 != BRANCH_PREFIX))
11012 continue;
11013
11014 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11015 COND_JUMP_PREFIX. */
11016 max_prefix_length = 0;
11017 for (next_fragP = fragP;
11018 next_fragP != NULL;
11019 next_fragP = next_fragP->fr_next)
11020 {
11021 if (next_fragP->fr_type == rs_fill)
11022 /* Skip rs_fill frags. */
11023 continue;
11024 else if (next_fragP->fr_type != rs_machine_dependent)
11025 /* Stop for all other frags. */
11026 break;
11027
11028 /* rs_machine_dependent frags. */
11029 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11030 == BRANCH_PREFIX)
11031 {
11032 /* Count BRANCH_PREFIX frags. */
11033 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11034 {
11035 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11036 frag_wane (next_fragP);
11037 }
11038 else
11039 max_prefix_length
11040 += next_fragP->tc_frag_data.max_bytes;
11041 }
11042 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11043 == BRANCH_PADDING)
11044 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11045 == FUSED_JCC_PADDING))
11046 {
11047 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11048 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11049 break;
11050 }
11051 else
11052 /* Stop for other rs_machine_dependent frags. */
11053 break;
11054 }
11055
11056 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11057
11058 /* Skip to the next frag. */
11059 fragP = next_fragP;
11060 }
11061 }
11062
11063 /* Compute padding size for
11064
11065 FUSED_JCC_PADDING
11066 CMP like instruction
11067 BRANCH_PADDING
11068 COND_JUMP/UNCOND_JUMP
11069
11070 or
11071
11072 BRANCH_PADDING
11073 COND_JUMP/UNCOND_JUMP
11074 */
11075
11076 static int
11077 i386_branch_padding_size (fragS *fragP, offsetT address)
11078 {
11079 unsigned int offset, size, padding_size;
11080 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11081
11082 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11083 if (!address)
11084 address = fragP->fr_address;
11085 address += fragP->fr_fix;
11086
11087 /* CMP like instrunction size. */
11088 size = fragP->tc_frag_data.cmp_size;
11089
11090 /* The base size of the branch frag. */
11091 size += branch_fragP->fr_fix;
11092
11093 /* Add opcode and displacement bytes for the rs_machine_dependent
11094 branch frag. */
11095 if (branch_fragP->fr_type == rs_machine_dependent)
11096 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11097
11098 /* Check if branch is within boundary and doesn't end at the last
11099 byte. */
11100 offset = address & ((1U << align_branch_power) - 1);
11101 if ((offset + size) >= (1U << align_branch_power))
11102 /* Padding needed to avoid crossing boundary. */
11103 padding_size = (1U << align_branch_power) - offset;
11104 else
11105 /* No padding needed. */
11106 padding_size = 0;
11107
11108 /* The return value may be saved in tc_frag_data.length which is
11109 unsigned byte. */
11110 if (!fits_in_unsigned_byte (padding_size))
11111 abort ();
11112
11113 return padding_size;
11114 }
11115
11116 /* i386_generic_table_relax_frag()
11117
11118 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11119 grow/shrink padding to align branch frags. Hand others to
11120 relax_frag(). */
11121
11122 long
11123 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11124 {
11125 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11126 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11127 {
11128 long padding_size = i386_branch_padding_size (fragP, 0);
11129 long grow = padding_size - fragP->tc_frag_data.length;
11130
11131 /* When the BRANCH_PREFIX frag is used, the computed address
11132 must match the actual address and there should be no padding. */
11133 if (fragP->tc_frag_data.padding_address
11134 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11135 || padding_size))
11136 abort ();
11137
11138 /* Update the padding size. */
11139 if (grow)
11140 fragP->tc_frag_data.length = padding_size;
11141
11142 return grow;
11143 }
11144 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11145 {
11146 fragS *padding_fragP, *next_fragP;
11147 long padding_size, left_size, last_size;
11148
11149 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11150 if (!padding_fragP)
11151 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11152 return (fragP->tc_frag_data.length
11153 - fragP->tc_frag_data.last_length);
11154
11155 /* Compute the relative address of the padding frag in the very
11156 first time where the BRANCH_PREFIX frag sizes are zero. */
11157 if (!fragP->tc_frag_data.padding_address)
11158 fragP->tc_frag_data.padding_address
11159 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11160
11161 /* First update the last length from the previous interation. */
11162 left_size = fragP->tc_frag_data.prefix_length;
11163 for (next_fragP = fragP;
11164 next_fragP != padding_fragP;
11165 next_fragP = next_fragP->fr_next)
11166 if (next_fragP->fr_type == rs_machine_dependent
11167 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11168 == BRANCH_PREFIX))
11169 {
11170 if (left_size)
11171 {
11172 int max = next_fragP->tc_frag_data.max_bytes;
11173 if (max)
11174 {
11175 int size;
11176 if (max > left_size)
11177 size = left_size;
11178 else
11179 size = max;
11180 left_size -= size;
11181 next_fragP->tc_frag_data.last_length = size;
11182 }
11183 }
11184 else
11185 next_fragP->tc_frag_data.last_length = 0;
11186 }
11187
11188 /* Check the padding size for the padding frag. */
11189 padding_size = i386_branch_padding_size
11190 (padding_fragP, (fragP->fr_address
11191 + fragP->tc_frag_data.padding_address));
11192
11193 last_size = fragP->tc_frag_data.prefix_length;
11194 /* Check if there is change from the last interation. */
11195 if (padding_size == last_size)
11196 {
11197 /* Update the expected address of the padding frag. */
11198 padding_fragP->tc_frag_data.padding_address
11199 = (fragP->fr_address + padding_size
11200 + fragP->tc_frag_data.padding_address);
11201 return 0;
11202 }
11203
11204 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11205 {
11206 /* No padding if there is no sufficient room. Clear the
11207 expected address of the padding frag. */
11208 padding_fragP->tc_frag_data.padding_address = 0;
11209 padding_size = 0;
11210 }
11211 else
11212 /* Store the expected address of the padding frag. */
11213 padding_fragP->tc_frag_data.padding_address
11214 = (fragP->fr_address + padding_size
11215 + fragP->tc_frag_data.padding_address);
11216
11217 fragP->tc_frag_data.prefix_length = padding_size;
11218
11219 /* Update the length for the current interation. */
11220 left_size = padding_size;
11221 for (next_fragP = fragP;
11222 next_fragP != padding_fragP;
11223 next_fragP = next_fragP->fr_next)
11224 if (next_fragP->fr_type == rs_machine_dependent
11225 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11226 == BRANCH_PREFIX))
11227 {
11228 if (left_size)
11229 {
11230 int max = next_fragP->tc_frag_data.max_bytes;
11231 if (max)
11232 {
11233 int size;
11234 if (max > left_size)
11235 size = left_size;
11236 else
11237 size = max;
11238 left_size -= size;
11239 next_fragP->tc_frag_data.length = size;
11240 }
11241 }
11242 else
11243 next_fragP->tc_frag_data.length = 0;
11244 }
11245
11246 return (fragP->tc_frag_data.length
11247 - fragP->tc_frag_data.last_length);
11248 }
11249 return relax_frag (segment, fragP, stretch);
11250 }
11251
11252 /* md_estimate_size_before_relax()
11253
11254 Called just before relax() for rs_machine_dependent frags. The x86
11255 assembler uses these frags to handle variable size jump
11256 instructions.
11257
11258 Any symbol that is now undefined will not become defined.
11259 Return the correct fr_subtype in the frag.
11260 Return the initial "guess for variable size of frag" to caller.
11261 The guess is actually the growth beyond the fixed part. Whatever
11262 we do to grow the fixed or variable part contributes to our
11263 returned value. */
11264
11265 int
11266 md_estimate_size_before_relax (fragS *fragP, segT segment)
11267 {
11268 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11269 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
11270 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11271 {
11272 i386_classify_machine_dependent_frag (fragP);
11273 return fragP->tc_frag_data.length;
11274 }
11275
11276 /* We've already got fragP->fr_subtype right; all we have to do is
11277 check for un-relaxable symbols. On an ELF system, we can't relax
11278 an externally visible symbol, because it may be overridden by a
11279 shared library. */
11280 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
11281 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11282 || (IS_ELF
11283 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
11284 fragP->fr_var))
11285 #endif
11286 #if defined (OBJ_COFF) && defined (TE_PE)
11287 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
11288 && S_IS_WEAK (fragP->fr_symbol))
11289 #endif
11290 )
11291 {
11292 /* Symbol is undefined in this segment, or we need to keep a
11293 reloc so that weak symbols can be overridden. */
11294 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
11295 enum bfd_reloc_code_real reloc_type;
11296 unsigned char *opcode;
11297 int old_fr_fix;
11298
11299 if (fragP->fr_var != NO_RELOC)
11300 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
11301 else if (size == 2)
11302 reloc_type = BFD_RELOC_16_PCREL;
11303 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11304 else if (need_plt32_p (fragP->fr_symbol))
11305 reloc_type = BFD_RELOC_X86_64_PLT32;
11306 #endif
11307 else
11308 reloc_type = BFD_RELOC_32_PCREL;
11309
11310 old_fr_fix = fragP->fr_fix;
11311 opcode = (unsigned char *) fragP->fr_opcode;
11312
11313 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
11314 {
11315 case UNCOND_JUMP:
11316 /* Make jmp (0xeb) a (d)word displacement jump. */
11317 opcode[0] = 0xe9;
11318 fragP->fr_fix += size;
11319 fix_new (fragP, old_fr_fix, size,
11320 fragP->fr_symbol,
11321 fragP->fr_offset, 1,
11322 reloc_type);
11323 break;
11324
11325 case COND_JUMP86:
11326 if (size == 2
11327 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
11328 {
11329 /* Negate the condition, and branch past an
11330 unconditional jump. */
11331 opcode[0] ^= 1;
11332 opcode[1] = 3;
11333 /* Insert an unconditional jump. */
11334 opcode[2] = 0xe9;
11335 /* We added two extra opcode bytes, and have a two byte
11336 offset. */
11337 fragP->fr_fix += 2 + 2;
11338 fix_new (fragP, old_fr_fix + 2, 2,
11339 fragP->fr_symbol,
11340 fragP->fr_offset, 1,
11341 reloc_type);
11342 break;
11343 }
11344 /* Fall through. */
11345
11346 case COND_JUMP:
11347 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
11348 {
11349 fixS *fixP;
11350
11351 fragP->fr_fix += 1;
11352 fixP = fix_new (fragP, old_fr_fix, 1,
11353 fragP->fr_symbol,
11354 fragP->fr_offset, 1,
11355 BFD_RELOC_8_PCREL);
11356 fixP->fx_signed = 1;
11357 break;
11358 }
11359
11360 /* This changes the byte-displacement jump 0x7N
11361 to the (d)word-displacement jump 0x0f,0x8N. */
11362 opcode[1] = opcode[0] + 0x10;
11363 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11364 /* We've added an opcode byte. */
11365 fragP->fr_fix += 1 + size;
11366 fix_new (fragP, old_fr_fix + 1, size,
11367 fragP->fr_symbol,
11368 fragP->fr_offset, 1,
11369 reloc_type);
11370 break;
11371
11372 default:
11373 BAD_CASE (fragP->fr_subtype);
11374 break;
11375 }
11376 frag_wane (fragP);
11377 return fragP->fr_fix - old_fr_fix;
11378 }
11379
11380 /* Guess size depending on current relax state. Initially the relax
11381 state will correspond to a short jump and we return 1, because
11382 the variable part of the frag (the branch offset) is one byte
11383 long. However, we can relax a section more than once and in that
11384 case we must either set fr_subtype back to the unrelaxed state,
11385 or return the value for the appropriate branch. */
11386 return md_relax_table[fragP->fr_subtype].rlx_length;
11387 }
11388
11389 /* Called after relax() is finished.
11390
11391 In: Address of frag.
11392 fr_type == rs_machine_dependent.
11393 fr_subtype is what the address relaxed to.
11394
11395 Out: Any fixSs and constants are set up.
11396 Caller will turn frag into a ".space 0". */
11397
11398 void
11399 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
11400 fragS *fragP)
11401 {
11402 unsigned char *opcode;
11403 unsigned char *where_to_put_displacement = NULL;
11404 offsetT target_address;
11405 offsetT opcode_address;
11406 unsigned int extension = 0;
11407 offsetT displacement_from_opcode_start;
11408
11409 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11410 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
11411 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11412 {
11413 /* Generate nop padding. */
11414 unsigned int size = fragP->tc_frag_data.length;
11415 if (size)
11416 {
11417 if (size > fragP->tc_frag_data.max_bytes)
11418 abort ();
11419
11420 if (flag_debug)
11421 {
11422 const char *msg;
11423 const char *branch = "branch";
11424 const char *prefix = "";
11425 fragS *padding_fragP;
11426 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11427 == BRANCH_PREFIX)
11428 {
11429 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11430 switch (fragP->tc_frag_data.default_prefix)
11431 {
11432 default:
11433 abort ();
11434 break;
11435 case CS_PREFIX_OPCODE:
11436 prefix = " cs";
11437 break;
11438 case DS_PREFIX_OPCODE:
11439 prefix = " ds";
11440 break;
11441 case ES_PREFIX_OPCODE:
11442 prefix = " es";
11443 break;
11444 case FS_PREFIX_OPCODE:
11445 prefix = " fs";
11446 break;
11447 case GS_PREFIX_OPCODE:
11448 prefix = " gs";
11449 break;
11450 case SS_PREFIX_OPCODE:
11451 prefix = " ss";
11452 break;
11453 }
11454 if (padding_fragP)
11455 msg = _("%s:%u: add %d%s at 0x%llx to align "
11456 "%s within %d-byte boundary\n");
11457 else
11458 msg = _("%s:%u: add additional %d%s at 0x%llx to "
11459 "align %s within %d-byte boundary\n");
11460 }
11461 else
11462 {
11463 padding_fragP = fragP;
11464 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
11465 "%s within %d-byte boundary\n");
11466 }
11467
11468 if (padding_fragP)
11469 switch (padding_fragP->tc_frag_data.branch_type)
11470 {
11471 case align_branch_jcc:
11472 branch = "jcc";
11473 break;
11474 case align_branch_fused:
11475 branch = "fused jcc";
11476 break;
11477 case align_branch_jmp:
11478 branch = "jmp";
11479 break;
11480 case align_branch_call:
11481 branch = "call";
11482 break;
11483 case align_branch_indirect:
11484 branch = "indiret branch";
11485 break;
11486 case align_branch_ret:
11487 branch = "ret";
11488 break;
11489 default:
11490 break;
11491 }
11492
11493 fprintf (stdout, msg,
11494 fragP->fr_file, fragP->fr_line, size, prefix,
11495 (long long) fragP->fr_address, branch,
11496 1 << align_branch_power);
11497 }
11498 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11499 memset (fragP->fr_opcode,
11500 fragP->tc_frag_data.default_prefix, size);
11501 else
11502 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
11503 size, 0);
11504 fragP->fr_fix += size;
11505 }
11506 return;
11507 }
11508
11509 opcode = (unsigned char *) fragP->fr_opcode;
11510
11511 /* Address we want to reach in file space. */
11512 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
11513
11514 /* Address opcode resides at in file space. */
11515 opcode_address = fragP->fr_address + fragP->fr_fix;
11516
11517 /* Displacement from opcode start to fill into instruction. */
11518 displacement_from_opcode_start = target_address - opcode_address;
11519
11520 if ((fragP->fr_subtype & BIG) == 0)
11521 {
11522 /* Don't have to change opcode. */
11523 extension = 1; /* 1 opcode + 1 displacement */
11524 where_to_put_displacement = &opcode[1];
11525 }
11526 else
11527 {
11528 if (no_cond_jump_promotion
11529 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
11530 as_warn_where (fragP->fr_file, fragP->fr_line,
11531 _("long jump required"));
11532
11533 switch (fragP->fr_subtype)
11534 {
11535 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
11536 extension = 4; /* 1 opcode + 4 displacement */
11537 opcode[0] = 0xe9;
11538 where_to_put_displacement = &opcode[1];
11539 break;
11540
11541 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
11542 extension = 2; /* 1 opcode + 2 displacement */
11543 opcode[0] = 0xe9;
11544 where_to_put_displacement = &opcode[1];
11545 break;
11546
11547 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
11548 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
11549 extension = 5; /* 2 opcode + 4 displacement */
11550 opcode[1] = opcode[0] + 0x10;
11551 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11552 where_to_put_displacement = &opcode[2];
11553 break;
11554
11555 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
11556 extension = 3; /* 2 opcode + 2 displacement */
11557 opcode[1] = opcode[0] + 0x10;
11558 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
11559 where_to_put_displacement = &opcode[2];
11560 break;
11561
11562 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
11563 extension = 4;
11564 opcode[0] ^= 1;
11565 opcode[1] = 3;
11566 opcode[2] = 0xe9;
11567 where_to_put_displacement = &opcode[3];
11568 break;
11569
11570 default:
11571 BAD_CASE (fragP->fr_subtype);
11572 break;
11573 }
11574 }
11575
11576 /* If size if less then four we are sure that the operand fits,
11577 but if it's 4, then it could be that the displacement is larger
11578 then -/+ 2GB. */
11579 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
11580 && object_64bit
11581 && ((addressT) (displacement_from_opcode_start - extension
11582 + ((addressT) 1 << 31))
11583 > (((addressT) 2 << 31) - 1)))
11584 {
11585 as_bad_where (fragP->fr_file, fragP->fr_line,
11586 _("jump target out of range"));
11587 /* Make us emit 0. */
11588 displacement_from_opcode_start = extension;
11589 }
11590 /* Now put displacement after opcode. */
11591 md_number_to_chars ((char *) where_to_put_displacement,
11592 (valueT) (displacement_from_opcode_start - extension),
11593 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
11594 fragP->fr_fix += extension;
11595 }
11596 \f
11597 /* Apply a fixup (fixP) to segment data, once it has been determined
11598 by our caller that we have all the info we need to fix it up.
11599
11600 Parameter valP is the pointer to the value of the bits.
11601
11602 On the 386, immediates, displacements, and data pointers are all in
11603 the same (little-endian) format, so we don't need to care about which
11604 we are handling. */
11605
11606 void
11607 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
11608 {
11609 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
11610 valueT value = *valP;
11611
11612 #if !defined (TE_Mach)
11613 if (fixP->fx_pcrel)
11614 {
11615 switch (fixP->fx_r_type)
11616 {
11617 default:
11618 break;
11619
11620 case BFD_RELOC_64:
11621 fixP->fx_r_type = BFD_RELOC_64_PCREL;
11622 break;
11623 case BFD_RELOC_32:
11624 case BFD_RELOC_X86_64_32S:
11625 fixP->fx_r_type = BFD_RELOC_32_PCREL;
11626 break;
11627 case BFD_RELOC_16:
11628 fixP->fx_r_type = BFD_RELOC_16_PCREL;
11629 break;
11630 case BFD_RELOC_8:
11631 fixP->fx_r_type = BFD_RELOC_8_PCREL;
11632 break;
11633 }
11634 }
11635
11636 if (fixP->fx_addsy != NULL
11637 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
11638 || fixP->fx_r_type == BFD_RELOC_64_PCREL
11639 || fixP->fx_r_type == BFD_RELOC_16_PCREL
11640 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
11641 && !use_rela_relocations)
11642 {
11643 /* This is a hack. There should be a better way to handle this.
11644 This covers for the fact that bfd_install_relocation will
11645 subtract the current location (for partial_inplace, PC relative
11646 relocations); see more below. */
11647 #ifndef OBJ_AOUT
11648 if (IS_ELF
11649 #ifdef TE_PE
11650 || OUTPUT_FLAVOR == bfd_target_coff_flavour
11651 #endif
11652 )
11653 value += fixP->fx_where + fixP->fx_frag->fr_address;
11654 #endif
11655 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11656 if (IS_ELF)
11657 {
11658 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
11659
11660 if ((sym_seg == seg
11661 || (symbol_section_p (fixP->fx_addsy)
11662 && sym_seg != absolute_section))
11663 && !generic_force_reloc (fixP))
11664 {
11665 /* Yes, we add the values in twice. This is because
11666 bfd_install_relocation subtracts them out again. I think
11667 bfd_install_relocation is broken, but I don't dare change
11668 it. FIXME. */
11669 value += fixP->fx_where + fixP->fx_frag->fr_address;
11670 }
11671 }
11672 #endif
11673 #if defined (OBJ_COFF) && defined (TE_PE)
11674 /* For some reason, the PE format does not store a
11675 section address offset for a PC relative symbol. */
11676 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
11677 || S_IS_WEAK (fixP->fx_addsy))
11678 value += md_pcrel_from (fixP);
11679 #endif
11680 }
11681 #if defined (OBJ_COFF) && defined (TE_PE)
11682 if (fixP->fx_addsy != NULL
11683 && S_IS_WEAK (fixP->fx_addsy)
11684 /* PR 16858: Do not modify weak function references. */
11685 && ! fixP->fx_pcrel)
11686 {
11687 #if !defined (TE_PEP)
11688 /* For x86 PE weak function symbols are neither PC-relative
11689 nor do they set S_IS_FUNCTION. So the only reliable way
11690 to detect them is to check the flags of their containing
11691 section. */
11692 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
11693 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
11694 ;
11695 else
11696 #endif
11697 value -= S_GET_VALUE (fixP->fx_addsy);
11698 }
11699 #endif
11700
11701 /* Fix a few things - the dynamic linker expects certain values here,
11702 and we must not disappoint it. */
11703 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11704 if (IS_ELF && fixP->fx_addsy)
11705 switch (fixP->fx_r_type)
11706 {
11707 case BFD_RELOC_386_PLT32:
11708 case BFD_RELOC_X86_64_PLT32:
11709 /* Make the jump instruction point to the address of the operand.
11710 At runtime we merely add the offset to the actual PLT entry.
11711 NB: Subtract the offset size only for jump instructions. */
11712 if (fixP->fx_pcrel)
11713 value = -4;
11714 break;
11715
11716 case BFD_RELOC_386_TLS_GD:
11717 case BFD_RELOC_386_TLS_LDM:
11718 case BFD_RELOC_386_TLS_IE_32:
11719 case BFD_RELOC_386_TLS_IE:
11720 case BFD_RELOC_386_TLS_GOTIE:
11721 case BFD_RELOC_386_TLS_GOTDESC:
11722 case BFD_RELOC_X86_64_TLSGD:
11723 case BFD_RELOC_X86_64_TLSLD:
11724 case BFD_RELOC_X86_64_GOTTPOFF:
11725 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11726 value = 0; /* Fully resolved at runtime. No addend. */
11727 /* Fallthrough */
11728 case BFD_RELOC_386_TLS_LE:
11729 case BFD_RELOC_386_TLS_LDO_32:
11730 case BFD_RELOC_386_TLS_LE_32:
11731 case BFD_RELOC_X86_64_DTPOFF32:
11732 case BFD_RELOC_X86_64_DTPOFF64:
11733 case BFD_RELOC_X86_64_TPOFF32:
11734 case BFD_RELOC_X86_64_TPOFF64:
11735 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11736 break;
11737
11738 case BFD_RELOC_386_TLS_DESC_CALL:
11739 case BFD_RELOC_X86_64_TLSDESC_CALL:
11740 value = 0; /* Fully resolved at runtime. No addend. */
11741 S_SET_THREAD_LOCAL (fixP->fx_addsy);
11742 fixP->fx_done = 0;
11743 return;
11744
11745 case BFD_RELOC_VTABLE_INHERIT:
11746 case BFD_RELOC_VTABLE_ENTRY:
11747 fixP->fx_done = 0;
11748 return;
11749
11750 default:
11751 break;
11752 }
11753 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
11754 *valP = value;
11755 #endif /* !defined (TE_Mach) */
11756
11757 /* Are we finished with this relocation now? */
11758 if (fixP->fx_addsy == NULL)
11759 fixP->fx_done = 1;
11760 #if defined (OBJ_COFF) && defined (TE_PE)
11761 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
11762 {
11763 fixP->fx_done = 0;
11764 /* Remember value for tc_gen_reloc. */
11765 fixP->fx_addnumber = value;
11766 /* Clear out the frag for now. */
11767 value = 0;
11768 }
11769 #endif
11770 else if (use_rela_relocations)
11771 {
11772 fixP->fx_no_overflow = 1;
11773 /* Remember value for tc_gen_reloc. */
11774 fixP->fx_addnumber = value;
11775 value = 0;
11776 }
11777
11778 md_number_to_chars (p, value, fixP->fx_size);
11779 }
11780 \f
11781 const char *
11782 md_atof (int type, char *litP, int *sizeP)
11783 {
11784 /* This outputs the LITTLENUMs in REVERSE order;
11785 in accord with the bigendian 386. */
11786 return ieee_md_atof (type, litP, sizeP, FALSE);
11787 }
11788 \f
11789 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
11790
11791 static char *
11792 output_invalid (int c)
11793 {
11794 if (ISPRINT (c))
11795 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11796 "'%c'", c);
11797 else
11798 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
11799 "(0x%x)", (unsigned char) c);
11800 return output_invalid_buf;
11801 }
11802
11803 /* REG_STRING starts *before* REGISTER_PREFIX. */
11804
11805 static const reg_entry *
11806 parse_real_register (char *reg_string, char **end_op)
11807 {
11808 char *s = reg_string;
11809 char *p;
11810 char reg_name_given[MAX_REG_NAME_SIZE + 1];
11811 const reg_entry *r;
11812
11813 /* Skip possible REGISTER_PREFIX and possible whitespace. */
11814 if (*s == REGISTER_PREFIX)
11815 ++s;
11816
11817 if (is_space_char (*s))
11818 ++s;
11819
11820 p = reg_name_given;
11821 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
11822 {
11823 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
11824 return (const reg_entry *) NULL;
11825 s++;
11826 }
11827
11828 /* For naked regs, make sure that we are not dealing with an identifier.
11829 This prevents confusing an identifier like `eax_var' with register
11830 `eax'. */
11831 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
11832 return (const reg_entry *) NULL;
11833
11834 *end_op = s;
11835
11836 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
11837
11838 /* Handle floating point regs, allowing spaces in the (i) part. */
11839 if (r == i386_regtab /* %st is first entry of table */)
11840 {
11841 if (!cpu_arch_flags.bitfield.cpu8087
11842 && !cpu_arch_flags.bitfield.cpu287
11843 && !cpu_arch_flags.bitfield.cpu387)
11844 return (const reg_entry *) NULL;
11845
11846 if (is_space_char (*s))
11847 ++s;
11848 if (*s == '(')
11849 {
11850 ++s;
11851 if (is_space_char (*s))
11852 ++s;
11853 if (*s >= '0' && *s <= '7')
11854 {
11855 int fpr = *s - '0';
11856 ++s;
11857 if (is_space_char (*s))
11858 ++s;
11859 if (*s == ')')
11860 {
11861 *end_op = s + 1;
11862 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
11863 know (r);
11864 return r + fpr;
11865 }
11866 }
11867 /* We have "%st(" then garbage. */
11868 return (const reg_entry *) NULL;
11869 }
11870 }
11871
11872 if (r == NULL || allow_pseudo_reg)
11873 return r;
11874
11875 if (operand_type_all_zero (&r->reg_type))
11876 return (const reg_entry *) NULL;
11877
11878 if ((r->reg_type.bitfield.dword
11879 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
11880 || r->reg_type.bitfield.class == RegCR
11881 || r->reg_type.bitfield.class == RegDR
11882 || r->reg_type.bitfield.class == RegTR)
11883 && !cpu_arch_flags.bitfield.cpui386)
11884 return (const reg_entry *) NULL;
11885
11886 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
11887 return (const reg_entry *) NULL;
11888
11889 if (!cpu_arch_flags.bitfield.cpuavx512f)
11890 {
11891 if (r->reg_type.bitfield.zmmword
11892 || r->reg_type.bitfield.class == RegMask)
11893 return (const reg_entry *) NULL;
11894
11895 if (!cpu_arch_flags.bitfield.cpuavx)
11896 {
11897 if (r->reg_type.bitfield.ymmword)
11898 return (const reg_entry *) NULL;
11899
11900 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
11901 return (const reg_entry *) NULL;
11902 }
11903 }
11904
11905 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
11906 return (const reg_entry *) NULL;
11907
11908 /* Don't allow fake index register unless allow_index_reg isn't 0. */
11909 if (!allow_index_reg && r->reg_num == RegIZ)
11910 return (const reg_entry *) NULL;
11911
11912 /* Upper 16 vector registers are only available with VREX in 64bit
11913 mode, and require EVEX encoding. */
11914 if (r->reg_flags & RegVRex)
11915 {
11916 if (!cpu_arch_flags.bitfield.cpuavx512f
11917 || flag_code != CODE_64BIT)
11918 return (const reg_entry *) NULL;
11919
11920 i.vec_encoding = vex_encoding_evex;
11921 }
11922
11923 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
11924 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
11925 && flag_code != CODE_64BIT)
11926 return (const reg_entry *) NULL;
11927
11928 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
11929 && !intel_syntax)
11930 return (const reg_entry *) NULL;
11931
11932 return r;
11933 }
11934
11935 /* REG_STRING starts *before* REGISTER_PREFIX. */
11936
11937 static const reg_entry *
11938 parse_register (char *reg_string, char **end_op)
11939 {
11940 const reg_entry *r;
11941
11942 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
11943 r = parse_real_register (reg_string, end_op);
11944 else
11945 r = NULL;
11946 if (!r)
11947 {
11948 char *save = input_line_pointer;
11949 char c;
11950 symbolS *symbolP;
11951
11952 input_line_pointer = reg_string;
11953 c = get_symbol_name (&reg_string);
11954 symbolP = symbol_find (reg_string);
11955 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
11956 {
11957 const expressionS *e = symbol_get_value_expression (symbolP);
11958
11959 know (e->X_op == O_register);
11960 know (e->X_add_number >= 0
11961 && (valueT) e->X_add_number < i386_regtab_size);
11962 r = i386_regtab + e->X_add_number;
11963 if ((r->reg_flags & RegVRex))
11964 i.vec_encoding = vex_encoding_evex;
11965 *end_op = input_line_pointer;
11966 }
11967 *input_line_pointer = c;
11968 input_line_pointer = save;
11969 }
11970 return r;
11971 }
11972
11973 int
11974 i386_parse_name (char *name, expressionS *e, char *nextcharP)
11975 {
11976 const reg_entry *r;
11977 char *end = input_line_pointer;
11978
11979 *end = *nextcharP;
11980 r = parse_register (name, &input_line_pointer);
11981 if (r && end <= input_line_pointer)
11982 {
11983 *nextcharP = *input_line_pointer;
11984 *input_line_pointer = 0;
11985 e->X_op = O_register;
11986 e->X_add_number = r - i386_regtab;
11987 return 1;
11988 }
11989 input_line_pointer = end;
11990 *end = 0;
11991 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
11992 }
11993
11994 void
11995 md_operand (expressionS *e)
11996 {
11997 char *end;
11998 const reg_entry *r;
11999
12000 switch (*input_line_pointer)
12001 {
12002 case REGISTER_PREFIX:
12003 r = parse_real_register (input_line_pointer, &end);
12004 if (r)
12005 {
12006 e->X_op = O_register;
12007 e->X_add_number = r - i386_regtab;
12008 input_line_pointer = end;
12009 }
12010 break;
12011
12012 case '[':
12013 gas_assert (intel_syntax);
12014 end = input_line_pointer++;
12015 expression (e);
12016 if (*input_line_pointer == ']')
12017 {
12018 ++input_line_pointer;
12019 e->X_op_symbol = make_expr_symbol (e);
12020 e->X_add_symbol = NULL;
12021 e->X_add_number = 0;
12022 e->X_op = O_index;
12023 }
12024 else
12025 {
12026 e->X_op = O_absent;
12027 input_line_pointer = end;
12028 }
12029 break;
12030 }
12031 }
12032
12033 \f
12034 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12035 const char *md_shortopts = "kVQ:sqnO::";
12036 #else
12037 const char *md_shortopts = "qnO::";
12038 #endif
12039
12040 #define OPTION_32 (OPTION_MD_BASE + 0)
12041 #define OPTION_64 (OPTION_MD_BASE + 1)
12042 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12043 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12044 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12045 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12046 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12047 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12048 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12049 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12050 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12051 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12052 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12053 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12054 #define OPTION_X32 (OPTION_MD_BASE + 14)
12055 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12056 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12057 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12058 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12059 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12060 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12061 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12062 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12063 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12064 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12065 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12066 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12067 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12068 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12069 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12070 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12071
12072 struct option md_longopts[] =
12073 {
12074 {"32", no_argument, NULL, OPTION_32},
12075 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12076 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12077 {"64", no_argument, NULL, OPTION_64},
12078 #endif
12079 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12080 {"x32", no_argument, NULL, OPTION_X32},
12081 {"mshared", no_argument, NULL, OPTION_MSHARED},
12082 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12083 #endif
12084 {"divide", no_argument, NULL, OPTION_DIVIDE},
12085 {"march", required_argument, NULL, OPTION_MARCH},
12086 {"mtune", required_argument, NULL, OPTION_MTUNE},
12087 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12088 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12089 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12090 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12091 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12092 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12093 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12094 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12095 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12096 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12097 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12098 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12099 # if defined (TE_PE) || defined (TE_PEP)
12100 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12101 #endif
12102 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12103 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12104 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12105 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12106 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12107 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12108 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12109 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12110 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12111 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12112 {NULL, no_argument, NULL, 0}
12113 };
12114 size_t md_longopts_size = sizeof (md_longopts);
12115
12116 int
12117 md_parse_option (int c, const char *arg)
12118 {
12119 unsigned int j;
12120 char *arch, *next, *saved, *type;
12121
12122 switch (c)
12123 {
12124 case 'n':
12125 optimize_align_code = 0;
12126 break;
12127
12128 case 'q':
12129 quiet_warnings = 1;
12130 break;
12131
12132 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12133 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12134 should be emitted or not. FIXME: Not implemented. */
12135 case 'Q':
12136 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12137 return 0;
12138 break;
12139
12140 /* -V: SVR4 argument to print version ID. */
12141 case 'V':
12142 print_version_id ();
12143 break;
12144
12145 /* -k: Ignore for FreeBSD compatibility. */
12146 case 'k':
12147 break;
12148
12149 case 's':
12150 /* -s: On i386 Solaris, this tells the native assembler to use
12151 .stab instead of .stab.excl. We always use .stab anyhow. */
12152 break;
12153
12154 case OPTION_MSHARED:
12155 shared = 1;
12156 break;
12157
12158 case OPTION_X86_USED_NOTE:
12159 if (strcasecmp (arg, "yes") == 0)
12160 x86_used_note = 1;
12161 else if (strcasecmp (arg, "no") == 0)
12162 x86_used_note = 0;
12163 else
12164 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12165 break;
12166
12167
12168 #endif
12169 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12170 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12171 case OPTION_64:
12172 {
12173 const char **list, **l;
12174
12175 list = bfd_target_list ();
12176 for (l = list; *l != NULL; l++)
12177 if (CONST_STRNEQ (*l, "elf64-x86-64")
12178 || strcmp (*l, "coff-x86-64") == 0
12179 || strcmp (*l, "pe-x86-64") == 0
12180 || strcmp (*l, "pei-x86-64") == 0
12181 || strcmp (*l, "mach-o-x86-64") == 0)
12182 {
12183 default_arch = "x86_64";
12184 break;
12185 }
12186 if (*l == NULL)
12187 as_fatal (_("no compiled in support for x86_64"));
12188 free (list);
12189 }
12190 break;
12191 #endif
12192
12193 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12194 case OPTION_X32:
12195 if (IS_ELF)
12196 {
12197 const char **list, **l;
12198
12199 list = bfd_target_list ();
12200 for (l = list; *l != NULL; l++)
12201 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12202 {
12203 default_arch = "x86_64:32";
12204 break;
12205 }
12206 if (*l == NULL)
12207 as_fatal (_("no compiled in support for 32bit x86_64"));
12208 free (list);
12209 }
12210 else
12211 as_fatal (_("32bit x86_64 is only supported for ELF"));
12212 break;
12213 #endif
12214
12215 case OPTION_32:
12216 default_arch = "i386";
12217 break;
12218
12219 case OPTION_DIVIDE:
12220 #ifdef SVR4_COMMENT_CHARS
12221 {
12222 char *n, *t;
12223 const char *s;
12224
12225 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
12226 t = n;
12227 for (s = i386_comment_chars; *s != '\0'; s++)
12228 if (*s != '/')
12229 *t++ = *s;
12230 *t = '\0';
12231 i386_comment_chars = n;
12232 }
12233 #endif
12234 break;
12235
12236 case OPTION_MARCH:
12237 saved = xstrdup (arg);
12238 arch = saved;
12239 /* Allow -march=+nosse. */
12240 if (*arch == '+')
12241 arch++;
12242 do
12243 {
12244 if (*arch == '.')
12245 as_fatal (_("invalid -march= option: `%s'"), arg);
12246 next = strchr (arch, '+');
12247 if (next)
12248 *next++ = '\0';
12249 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12250 {
12251 if (strcmp (arch, cpu_arch [j].name) == 0)
12252 {
12253 /* Processor. */
12254 if (! cpu_arch[j].flags.bitfield.cpui386)
12255 continue;
12256
12257 cpu_arch_name = cpu_arch[j].name;
12258 cpu_sub_arch_name = NULL;
12259 cpu_arch_flags = cpu_arch[j].flags;
12260 cpu_arch_isa = cpu_arch[j].type;
12261 cpu_arch_isa_flags = cpu_arch[j].flags;
12262 if (!cpu_arch_tune_set)
12263 {
12264 cpu_arch_tune = cpu_arch_isa;
12265 cpu_arch_tune_flags = cpu_arch_isa_flags;
12266 }
12267 break;
12268 }
12269 else if (*cpu_arch [j].name == '.'
12270 && strcmp (arch, cpu_arch [j].name + 1) == 0)
12271 {
12272 /* ISA extension. */
12273 i386_cpu_flags flags;
12274
12275 flags = cpu_flags_or (cpu_arch_flags,
12276 cpu_arch[j].flags);
12277
12278 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12279 {
12280 if (cpu_sub_arch_name)
12281 {
12282 char *name = cpu_sub_arch_name;
12283 cpu_sub_arch_name = concat (name,
12284 cpu_arch[j].name,
12285 (const char *) NULL);
12286 free (name);
12287 }
12288 else
12289 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
12290 cpu_arch_flags = flags;
12291 cpu_arch_isa_flags = flags;
12292 }
12293 else
12294 cpu_arch_isa_flags
12295 = cpu_flags_or (cpu_arch_isa_flags,
12296 cpu_arch[j].flags);
12297 break;
12298 }
12299 }
12300
12301 if (j >= ARRAY_SIZE (cpu_arch))
12302 {
12303 /* Disable an ISA extension. */
12304 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12305 if (strcmp (arch, cpu_noarch [j].name) == 0)
12306 {
12307 i386_cpu_flags flags;
12308
12309 flags = cpu_flags_and_not (cpu_arch_flags,
12310 cpu_noarch[j].flags);
12311 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
12312 {
12313 if (cpu_sub_arch_name)
12314 {
12315 char *name = cpu_sub_arch_name;
12316 cpu_sub_arch_name = concat (arch,
12317 (const char *) NULL);
12318 free (name);
12319 }
12320 else
12321 cpu_sub_arch_name = xstrdup (arch);
12322 cpu_arch_flags = flags;
12323 cpu_arch_isa_flags = flags;
12324 }
12325 break;
12326 }
12327
12328 if (j >= ARRAY_SIZE (cpu_noarch))
12329 j = ARRAY_SIZE (cpu_arch);
12330 }
12331
12332 if (j >= ARRAY_SIZE (cpu_arch))
12333 as_fatal (_("invalid -march= option: `%s'"), arg);
12334
12335 arch = next;
12336 }
12337 while (next != NULL);
12338 free (saved);
12339 break;
12340
12341 case OPTION_MTUNE:
12342 if (*arg == '.')
12343 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12344 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12345 {
12346 if (strcmp (arg, cpu_arch [j].name) == 0)
12347 {
12348 cpu_arch_tune_set = 1;
12349 cpu_arch_tune = cpu_arch [j].type;
12350 cpu_arch_tune_flags = cpu_arch[j].flags;
12351 break;
12352 }
12353 }
12354 if (j >= ARRAY_SIZE (cpu_arch))
12355 as_fatal (_("invalid -mtune= option: `%s'"), arg);
12356 break;
12357
12358 case OPTION_MMNEMONIC:
12359 if (strcasecmp (arg, "att") == 0)
12360 intel_mnemonic = 0;
12361 else if (strcasecmp (arg, "intel") == 0)
12362 intel_mnemonic = 1;
12363 else
12364 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
12365 break;
12366
12367 case OPTION_MSYNTAX:
12368 if (strcasecmp (arg, "att") == 0)
12369 intel_syntax = 0;
12370 else if (strcasecmp (arg, "intel") == 0)
12371 intel_syntax = 1;
12372 else
12373 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
12374 break;
12375
12376 case OPTION_MINDEX_REG:
12377 allow_index_reg = 1;
12378 break;
12379
12380 case OPTION_MNAKED_REG:
12381 allow_naked_reg = 1;
12382 break;
12383
12384 case OPTION_MSSE2AVX:
12385 sse2avx = 1;
12386 break;
12387
12388 case OPTION_MSSE_CHECK:
12389 if (strcasecmp (arg, "error") == 0)
12390 sse_check = check_error;
12391 else if (strcasecmp (arg, "warning") == 0)
12392 sse_check = check_warning;
12393 else if (strcasecmp (arg, "none") == 0)
12394 sse_check = check_none;
12395 else
12396 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
12397 break;
12398
12399 case OPTION_MOPERAND_CHECK:
12400 if (strcasecmp (arg, "error") == 0)
12401 operand_check = check_error;
12402 else if (strcasecmp (arg, "warning") == 0)
12403 operand_check = check_warning;
12404 else if (strcasecmp (arg, "none") == 0)
12405 operand_check = check_none;
12406 else
12407 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
12408 break;
12409
12410 case OPTION_MAVXSCALAR:
12411 if (strcasecmp (arg, "128") == 0)
12412 avxscalar = vex128;
12413 else if (strcasecmp (arg, "256") == 0)
12414 avxscalar = vex256;
12415 else
12416 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
12417 break;
12418
12419 case OPTION_MVEXWIG:
12420 if (strcmp (arg, "0") == 0)
12421 vexwig = vexw0;
12422 else if (strcmp (arg, "1") == 0)
12423 vexwig = vexw1;
12424 else
12425 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
12426 break;
12427
12428 case OPTION_MADD_BND_PREFIX:
12429 add_bnd_prefix = 1;
12430 break;
12431
12432 case OPTION_MEVEXLIG:
12433 if (strcmp (arg, "128") == 0)
12434 evexlig = evexl128;
12435 else if (strcmp (arg, "256") == 0)
12436 evexlig = evexl256;
12437 else if (strcmp (arg, "512") == 0)
12438 evexlig = evexl512;
12439 else
12440 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
12441 break;
12442
12443 case OPTION_MEVEXRCIG:
12444 if (strcmp (arg, "rne") == 0)
12445 evexrcig = rne;
12446 else if (strcmp (arg, "rd") == 0)
12447 evexrcig = rd;
12448 else if (strcmp (arg, "ru") == 0)
12449 evexrcig = ru;
12450 else if (strcmp (arg, "rz") == 0)
12451 evexrcig = rz;
12452 else
12453 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
12454 break;
12455
12456 case OPTION_MEVEXWIG:
12457 if (strcmp (arg, "0") == 0)
12458 evexwig = evexw0;
12459 else if (strcmp (arg, "1") == 0)
12460 evexwig = evexw1;
12461 else
12462 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
12463 break;
12464
12465 # if defined (TE_PE) || defined (TE_PEP)
12466 case OPTION_MBIG_OBJ:
12467 use_big_obj = 1;
12468 break;
12469 #endif
12470
12471 case OPTION_MOMIT_LOCK_PREFIX:
12472 if (strcasecmp (arg, "yes") == 0)
12473 omit_lock_prefix = 1;
12474 else if (strcasecmp (arg, "no") == 0)
12475 omit_lock_prefix = 0;
12476 else
12477 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
12478 break;
12479
12480 case OPTION_MFENCE_AS_LOCK_ADD:
12481 if (strcasecmp (arg, "yes") == 0)
12482 avoid_fence = 1;
12483 else if (strcasecmp (arg, "no") == 0)
12484 avoid_fence = 0;
12485 else
12486 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
12487 break;
12488
12489 case OPTION_MRELAX_RELOCATIONS:
12490 if (strcasecmp (arg, "yes") == 0)
12491 generate_relax_relocations = 1;
12492 else if (strcasecmp (arg, "no") == 0)
12493 generate_relax_relocations = 0;
12494 else
12495 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
12496 break;
12497
12498 case OPTION_MALIGN_BRANCH_BOUNDARY:
12499 {
12500 char *end;
12501 long int align = strtoul (arg, &end, 0);
12502 if (*end == '\0')
12503 {
12504 if (align == 0)
12505 {
12506 align_branch_power = 0;
12507 break;
12508 }
12509 else if (align >= 16)
12510 {
12511 int align_power;
12512 for (align_power = 0;
12513 (align & 1) == 0;
12514 align >>= 1, align_power++)
12515 continue;
12516 /* Limit alignment power to 31. */
12517 if (align == 1 && align_power < 32)
12518 {
12519 align_branch_power = align_power;
12520 break;
12521 }
12522 }
12523 }
12524 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
12525 }
12526 break;
12527
12528 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
12529 {
12530 char *end;
12531 int align = strtoul (arg, &end, 0);
12532 /* Some processors only support 5 prefixes. */
12533 if (*end == '\0' && align >= 0 && align < 6)
12534 {
12535 align_branch_prefix_size = align;
12536 break;
12537 }
12538 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
12539 arg);
12540 }
12541 break;
12542
12543 case OPTION_MALIGN_BRANCH:
12544 align_branch = 0;
12545 saved = xstrdup (arg);
12546 type = saved;
12547 do
12548 {
12549 next = strchr (type, '+');
12550 if (next)
12551 *next++ = '\0';
12552 if (strcasecmp (type, "jcc") == 0)
12553 align_branch |= align_branch_jcc_bit;
12554 else if (strcasecmp (type, "fused") == 0)
12555 align_branch |= align_branch_fused_bit;
12556 else if (strcasecmp (type, "jmp") == 0)
12557 align_branch |= align_branch_jmp_bit;
12558 else if (strcasecmp (type, "call") == 0)
12559 align_branch |= align_branch_call_bit;
12560 else if (strcasecmp (type, "ret") == 0)
12561 align_branch |= align_branch_ret_bit;
12562 else if (strcasecmp (type, "indirect") == 0)
12563 align_branch |= align_branch_indirect_bit;
12564 else
12565 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
12566 type = next;
12567 }
12568 while (next != NULL);
12569 free (saved);
12570 break;
12571
12572 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
12573 align_branch_power = 5;
12574 align_branch_prefix_size = 5;
12575 align_branch = (align_branch_jcc_bit
12576 | align_branch_fused_bit
12577 | align_branch_jmp_bit);
12578 break;
12579
12580 case OPTION_MAMD64:
12581 isa64 = amd64;
12582 break;
12583
12584 case OPTION_MINTEL64:
12585 isa64 = intel64;
12586 break;
12587
12588 case 'O':
12589 if (arg == NULL)
12590 {
12591 optimize = 1;
12592 /* Turn off -Os. */
12593 optimize_for_space = 0;
12594 }
12595 else if (*arg == 's')
12596 {
12597 optimize_for_space = 1;
12598 /* Turn on all encoding optimizations. */
12599 optimize = INT_MAX;
12600 }
12601 else
12602 {
12603 optimize = atoi (arg);
12604 /* Turn off -Os. */
12605 optimize_for_space = 0;
12606 }
12607 break;
12608
12609 default:
12610 return 0;
12611 }
12612 return 1;
12613 }
12614
12615 #define MESSAGE_TEMPLATE \
12616 " "
12617
12618 static char *
12619 output_message (FILE *stream, char *p, char *message, char *start,
12620 int *left_p, const char *name, int len)
12621 {
12622 int size = sizeof (MESSAGE_TEMPLATE);
12623 int left = *left_p;
12624
12625 /* Reserve 2 spaces for ", " or ",\0" */
12626 left -= len + 2;
12627
12628 /* Check if there is any room. */
12629 if (left >= 0)
12630 {
12631 if (p != start)
12632 {
12633 *p++ = ',';
12634 *p++ = ' ';
12635 }
12636 p = mempcpy (p, name, len);
12637 }
12638 else
12639 {
12640 /* Output the current message now and start a new one. */
12641 *p++ = ',';
12642 *p = '\0';
12643 fprintf (stream, "%s\n", message);
12644 p = start;
12645 left = size - (start - message) - len - 2;
12646
12647 gas_assert (left >= 0);
12648
12649 p = mempcpy (p, name, len);
12650 }
12651
12652 *left_p = left;
12653 return p;
12654 }
12655
12656 static void
12657 show_arch (FILE *stream, int ext, int check)
12658 {
12659 static char message[] = MESSAGE_TEMPLATE;
12660 char *start = message + 27;
12661 char *p;
12662 int size = sizeof (MESSAGE_TEMPLATE);
12663 int left;
12664 const char *name;
12665 int len;
12666 unsigned int j;
12667
12668 p = start;
12669 left = size - (start - message);
12670 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
12671 {
12672 /* Should it be skipped? */
12673 if (cpu_arch [j].skip)
12674 continue;
12675
12676 name = cpu_arch [j].name;
12677 len = cpu_arch [j].len;
12678 if (*name == '.')
12679 {
12680 /* It is an extension. Skip if we aren't asked to show it. */
12681 if (ext)
12682 {
12683 name++;
12684 len--;
12685 }
12686 else
12687 continue;
12688 }
12689 else if (ext)
12690 {
12691 /* It is an processor. Skip if we show only extension. */
12692 continue;
12693 }
12694 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
12695 {
12696 /* It is an impossible processor - skip. */
12697 continue;
12698 }
12699
12700 p = output_message (stream, p, message, start, &left, name, len);
12701 }
12702
12703 /* Display disabled extensions. */
12704 if (ext)
12705 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
12706 {
12707 name = cpu_noarch [j].name;
12708 len = cpu_noarch [j].len;
12709 p = output_message (stream, p, message, start, &left, name,
12710 len);
12711 }
12712
12713 *p = '\0';
12714 fprintf (stream, "%s\n", message);
12715 }
12716
12717 void
12718 md_show_usage (FILE *stream)
12719 {
12720 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12721 fprintf (stream, _("\
12722 -Qy, -Qn ignored\n\
12723 -V print assembler version number\n\
12724 -k ignored\n"));
12725 #endif
12726 fprintf (stream, _("\
12727 -n Do not optimize code alignment\n\
12728 -q quieten some warnings\n"));
12729 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12730 fprintf (stream, _("\
12731 -s ignored\n"));
12732 #endif
12733 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12734 || defined (TE_PE) || defined (TE_PEP))
12735 fprintf (stream, _("\
12736 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
12737 #endif
12738 #ifdef SVR4_COMMENT_CHARS
12739 fprintf (stream, _("\
12740 --divide do not treat `/' as a comment character\n"));
12741 #else
12742 fprintf (stream, _("\
12743 --divide ignored\n"));
12744 #endif
12745 fprintf (stream, _("\
12746 -march=CPU[,+EXTENSION...]\n\
12747 generate code for CPU and EXTENSION, CPU is one of:\n"));
12748 show_arch (stream, 0, 1);
12749 fprintf (stream, _("\
12750 EXTENSION is combination of:\n"));
12751 show_arch (stream, 1, 0);
12752 fprintf (stream, _("\
12753 -mtune=CPU optimize for CPU, CPU is one of:\n"));
12754 show_arch (stream, 0, 0);
12755 fprintf (stream, _("\
12756 -msse2avx encode SSE instructions with VEX prefix\n"));
12757 fprintf (stream, _("\
12758 -msse-check=[none|error|warning] (default: warning)\n\
12759 check SSE instructions\n"));
12760 fprintf (stream, _("\
12761 -moperand-check=[none|error|warning] (default: warning)\n\
12762 check operand combinations for validity\n"));
12763 fprintf (stream, _("\
12764 -mavxscalar=[128|256] (default: 128)\n\
12765 encode scalar AVX instructions with specific vector\n\
12766 length\n"));
12767 fprintf (stream, _("\
12768 -mvexwig=[0|1] (default: 0)\n\
12769 encode VEX instructions with specific VEX.W value\n\
12770 for VEX.W bit ignored instructions\n"));
12771 fprintf (stream, _("\
12772 -mevexlig=[128|256|512] (default: 128)\n\
12773 encode scalar EVEX instructions with specific vector\n\
12774 length\n"));
12775 fprintf (stream, _("\
12776 -mevexwig=[0|1] (default: 0)\n\
12777 encode EVEX instructions with specific EVEX.W value\n\
12778 for EVEX.W bit ignored instructions\n"));
12779 fprintf (stream, _("\
12780 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
12781 encode EVEX instructions with specific EVEX.RC value\n\
12782 for SAE-only ignored instructions\n"));
12783 fprintf (stream, _("\
12784 -mmnemonic=[att|intel] "));
12785 if (SYSV386_COMPAT)
12786 fprintf (stream, _("(default: att)\n"));
12787 else
12788 fprintf (stream, _("(default: intel)\n"));
12789 fprintf (stream, _("\
12790 use AT&T/Intel mnemonic\n"));
12791 fprintf (stream, _("\
12792 -msyntax=[att|intel] (default: att)\n\
12793 use AT&T/Intel syntax\n"));
12794 fprintf (stream, _("\
12795 -mindex-reg support pseudo index registers\n"));
12796 fprintf (stream, _("\
12797 -mnaked-reg don't require `%%' prefix for registers\n"));
12798 fprintf (stream, _("\
12799 -madd-bnd-prefix add BND prefix for all valid branches\n"));
12800 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12801 fprintf (stream, _("\
12802 -mshared disable branch optimization for shared code\n"));
12803 fprintf (stream, _("\
12804 -mx86-used-note=[no|yes] "));
12805 if (DEFAULT_X86_USED_NOTE)
12806 fprintf (stream, _("(default: yes)\n"));
12807 else
12808 fprintf (stream, _("(default: no)\n"));
12809 fprintf (stream, _("\
12810 generate x86 used ISA and feature properties\n"));
12811 #endif
12812 #if defined (TE_PE) || defined (TE_PEP)
12813 fprintf (stream, _("\
12814 -mbig-obj generate big object files\n"));
12815 #endif
12816 fprintf (stream, _("\
12817 -momit-lock-prefix=[no|yes] (default: no)\n\
12818 strip all lock prefixes\n"));
12819 fprintf (stream, _("\
12820 -mfence-as-lock-add=[no|yes] (default: no)\n\
12821 encode lfence, mfence and sfence as\n\
12822 lock addl $0x0, (%%{re}sp)\n"));
12823 fprintf (stream, _("\
12824 -mrelax-relocations=[no|yes] "));
12825 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
12826 fprintf (stream, _("(default: yes)\n"));
12827 else
12828 fprintf (stream, _("(default: no)\n"));
12829 fprintf (stream, _("\
12830 generate relax relocations\n"));
12831 fprintf (stream, _("\
12832 -malign-branch-boundary=NUM (default: 0)\n\
12833 align branches within NUM byte boundary\n"));
12834 fprintf (stream, _("\
12835 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
12836 TYPE is combination of jcc, fused, jmp, call, ret,\n\
12837 indirect\n\
12838 specify types of branches to align\n"));
12839 fprintf (stream, _("\
12840 -malign-branch-prefix-size=NUM (default: 5)\n\
12841 align branches with NUM prefixes per instruction\n"));
12842 fprintf (stream, _("\
12843 -mbranches-within-32B-boundaries\n\
12844 align branches within 32 byte boundary\n"));
12845 fprintf (stream, _("\
12846 -mamd64 accept only AMD64 ISA [default]\n"));
12847 fprintf (stream, _("\
12848 -mintel64 accept only Intel64 ISA\n"));
12849 }
12850
12851 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
12852 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12853 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12854
12855 /* Pick the target format to use. */
12856
12857 const char *
12858 i386_target_format (void)
12859 {
12860 if (!strncmp (default_arch, "x86_64", 6))
12861 {
12862 update_code_flag (CODE_64BIT, 1);
12863 if (default_arch[6] == '\0')
12864 x86_elf_abi = X86_64_ABI;
12865 else
12866 x86_elf_abi = X86_64_X32_ABI;
12867 }
12868 else if (!strcmp (default_arch, "i386"))
12869 update_code_flag (CODE_32BIT, 1);
12870 else if (!strcmp (default_arch, "iamcu"))
12871 {
12872 update_code_flag (CODE_32BIT, 1);
12873 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
12874 {
12875 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
12876 cpu_arch_name = "iamcu";
12877 cpu_sub_arch_name = NULL;
12878 cpu_arch_flags = iamcu_flags;
12879 cpu_arch_isa = PROCESSOR_IAMCU;
12880 cpu_arch_isa_flags = iamcu_flags;
12881 if (!cpu_arch_tune_set)
12882 {
12883 cpu_arch_tune = cpu_arch_isa;
12884 cpu_arch_tune_flags = cpu_arch_isa_flags;
12885 }
12886 }
12887 else if (cpu_arch_isa != PROCESSOR_IAMCU)
12888 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
12889 cpu_arch_name);
12890 }
12891 else
12892 as_fatal (_("unknown architecture"));
12893
12894 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
12895 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12896 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
12897 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
12898
12899 switch (OUTPUT_FLAVOR)
12900 {
12901 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
12902 case bfd_target_aout_flavour:
12903 return AOUT_TARGET_FORMAT;
12904 #endif
12905 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
12906 # if defined (TE_PE) || defined (TE_PEP)
12907 case bfd_target_coff_flavour:
12908 if (flag_code == CODE_64BIT)
12909 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
12910 else
12911 return "pe-i386";
12912 # elif defined (TE_GO32)
12913 case bfd_target_coff_flavour:
12914 return "coff-go32";
12915 # else
12916 case bfd_target_coff_flavour:
12917 return "coff-i386";
12918 # endif
12919 #endif
12920 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12921 case bfd_target_elf_flavour:
12922 {
12923 const char *format;
12924
12925 switch (x86_elf_abi)
12926 {
12927 default:
12928 format = ELF_TARGET_FORMAT;
12929 #ifndef TE_SOLARIS
12930 tls_get_addr = "___tls_get_addr";
12931 #endif
12932 break;
12933 case X86_64_ABI:
12934 use_rela_relocations = 1;
12935 object_64bit = 1;
12936 #ifndef TE_SOLARIS
12937 tls_get_addr = "__tls_get_addr";
12938 #endif
12939 format = ELF_TARGET_FORMAT64;
12940 break;
12941 case X86_64_X32_ABI:
12942 use_rela_relocations = 1;
12943 object_64bit = 1;
12944 #ifndef TE_SOLARIS
12945 tls_get_addr = "__tls_get_addr";
12946 #endif
12947 disallow_64bit_reloc = 1;
12948 format = ELF_TARGET_FORMAT32;
12949 break;
12950 }
12951 if (cpu_arch_isa == PROCESSOR_L1OM)
12952 {
12953 if (x86_elf_abi != X86_64_ABI)
12954 as_fatal (_("Intel L1OM is 64bit only"));
12955 return ELF_TARGET_L1OM_FORMAT;
12956 }
12957 else if (cpu_arch_isa == PROCESSOR_K1OM)
12958 {
12959 if (x86_elf_abi != X86_64_ABI)
12960 as_fatal (_("Intel K1OM is 64bit only"));
12961 return ELF_TARGET_K1OM_FORMAT;
12962 }
12963 else if (cpu_arch_isa == PROCESSOR_IAMCU)
12964 {
12965 if (x86_elf_abi != I386_ABI)
12966 as_fatal (_("Intel MCU is 32bit only"));
12967 return ELF_TARGET_IAMCU_FORMAT;
12968 }
12969 else
12970 return format;
12971 }
12972 #endif
12973 #if defined (OBJ_MACH_O)
12974 case bfd_target_mach_o_flavour:
12975 if (flag_code == CODE_64BIT)
12976 {
12977 use_rela_relocations = 1;
12978 object_64bit = 1;
12979 return "mach-o-x86-64";
12980 }
12981 else
12982 return "mach-o-i386";
12983 #endif
12984 default:
12985 abort ();
12986 return NULL;
12987 }
12988 }
12989
12990 #endif /* OBJ_MAYBE_ more than one */
12991 \f
12992 symbolS *
12993 md_undefined_symbol (char *name)
12994 {
12995 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
12996 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
12997 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
12998 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
12999 {
13000 if (!GOT_symbol)
13001 {
13002 if (symbol_find (name))
13003 as_bad (_("GOT already in symbol table"));
13004 GOT_symbol = symbol_new (name, undefined_section,
13005 (valueT) 0, &zero_address_frag);
13006 };
13007 return GOT_symbol;
13008 }
13009 return 0;
13010 }
13011
13012 /* Round up a section size to the appropriate boundary. */
13013
13014 valueT
13015 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13016 {
13017 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13018 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13019 {
13020 /* For a.out, force the section size to be aligned. If we don't do
13021 this, BFD will align it for us, but it will not write out the
13022 final bytes of the section. This may be a bug in BFD, but it is
13023 easier to fix it here since that is how the other a.out targets
13024 work. */
13025 int align;
13026
13027 align = bfd_section_alignment (segment);
13028 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13029 }
13030 #endif
13031
13032 return size;
13033 }
13034
13035 /* On the i386, PC-relative offsets are relative to the start of the
13036 next instruction. That is, the address of the offset, plus its
13037 size, since the offset is always the last part of the insn. */
13038
13039 long
13040 md_pcrel_from (fixS *fixP)
13041 {
13042 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13043 }
13044
13045 #ifndef I386COFF
13046
13047 static void
13048 s_bss (int ignore ATTRIBUTE_UNUSED)
13049 {
13050 int temp;
13051
13052 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13053 if (IS_ELF)
13054 obj_elf_section_change_hook ();
13055 #endif
13056 temp = get_absolute_expression ();
13057 subseg_set (bss_section, (subsegT) temp);
13058 demand_empty_rest_of_line ();
13059 }
13060
13061 #endif
13062
13063 /* Remember constant directive. */
13064
13065 void
13066 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13067 {
13068 if (last_insn.kind != last_insn_directive
13069 && (bfd_section_flags (now_seg) & SEC_CODE))
13070 {
13071 last_insn.seg = now_seg;
13072 last_insn.kind = last_insn_directive;
13073 last_insn.name = "constant directive";
13074 last_insn.file = as_where (&last_insn.line);
13075 }
13076 }
13077
13078 void
13079 i386_validate_fix (fixS *fixp)
13080 {
13081 if (fixp->fx_subsy)
13082 {
13083 if (fixp->fx_subsy == GOT_symbol)
13084 {
13085 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13086 {
13087 if (!object_64bit)
13088 abort ();
13089 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13090 if (fixp->fx_tcbit2)
13091 fixp->fx_r_type = (fixp->fx_tcbit
13092 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13093 : BFD_RELOC_X86_64_GOTPCRELX);
13094 else
13095 #endif
13096 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13097 }
13098 else
13099 {
13100 if (!object_64bit)
13101 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13102 else
13103 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13104 }
13105 fixp->fx_subsy = 0;
13106 }
13107 }
13108 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13109 else if (!object_64bit)
13110 {
13111 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13112 && fixp->fx_tcbit2)
13113 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13114 }
13115 #endif
13116 }
13117
13118 arelent *
13119 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13120 {
13121 arelent *rel;
13122 bfd_reloc_code_real_type code;
13123
13124 switch (fixp->fx_r_type)
13125 {
13126 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13127 case BFD_RELOC_SIZE32:
13128 case BFD_RELOC_SIZE64:
13129 if (S_IS_DEFINED (fixp->fx_addsy)
13130 && !S_IS_EXTERNAL (fixp->fx_addsy))
13131 {
13132 /* Resolve size relocation against local symbol to size of
13133 the symbol plus addend. */
13134 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13135 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13136 && !fits_in_unsigned_long (value))
13137 as_bad_where (fixp->fx_file, fixp->fx_line,
13138 _("symbol size computation overflow"));
13139 fixp->fx_addsy = NULL;
13140 fixp->fx_subsy = NULL;
13141 md_apply_fix (fixp, (valueT *) &value, NULL);
13142 return NULL;
13143 }
13144 #endif
13145 /* Fall through. */
13146
13147 case BFD_RELOC_X86_64_PLT32:
13148 case BFD_RELOC_X86_64_GOT32:
13149 case BFD_RELOC_X86_64_GOTPCREL:
13150 case BFD_RELOC_X86_64_GOTPCRELX:
13151 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13152 case BFD_RELOC_386_PLT32:
13153 case BFD_RELOC_386_GOT32:
13154 case BFD_RELOC_386_GOT32X:
13155 case BFD_RELOC_386_GOTOFF:
13156 case BFD_RELOC_386_GOTPC:
13157 case BFD_RELOC_386_TLS_GD:
13158 case BFD_RELOC_386_TLS_LDM:
13159 case BFD_RELOC_386_TLS_LDO_32:
13160 case BFD_RELOC_386_TLS_IE_32:
13161 case BFD_RELOC_386_TLS_IE:
13162 case BFD_RELOC_386_TLS_GOTIE:
13163 case BFD_RELOC_386_TLS_LE_32:
13164 case BFD_RELOC_386_TLS_LE:
13165 case BFD_RELOC_386_TLS_GOTDESC:
13166 case BFD_RELOC_386_TLS_DESC_CALL:
13167 case BFD_RELOC_X86_64_TLSGD:
13168 case BFD_RELOC_X86_64_TLSLD:
13169 case BFD_RELOC_X86_64_DTPOFF32:
13170 case BFD_RELOC_X86_64_DTPOFF64:
13171 case BFD_RELOC_X86_64_GOTTPOFF:
13172 case BFD_RELOC_X86_64_TPOFF32:
13173 case BFD_RELOC_X86_64_TPOFF64:
13174 case BFD_RELOC_X86_64_GOTOFF64:
13175 case BFD_RELOC_X86_64_GOTPC32:
13176 case BFD_RELOC_X86_64_GOT64:
13177 case BFD_RELOC_X86_64_GOTPCREL64:
13178 case BFD_RELOC_X86_64_GOTPC64:
13179 case BFD_RELOC_X86_64_GOTPLT64:
13180 case BFD_RELOC_X86_64_PLTOFF64:
13181 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13182 case BFD_RELOC_X86_64_TLSDESC_CALL:
13183 case BFD_RELOC_RVA:
13184 case BFD_RELOC_VTABLE_ENTRY:
13185 case BFD_RELOC_VTABLE_INHERIT:
13186 #ifdef TE_PE
13187 case BFD_RELOC_32_SECREL:
13188 #endif
13189 code = fixp->fx_r_type;
13190 break;
13191 case BFD_RELOC_X86_64_32S:
13192 if (!fixp->fx_pcrel)
13193 {
13194 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
13195 code = fixp->fx_r_type;
13196 break;
13197 }
13198 /* Fall through. */
13199 default:
13200 if (fixp->fx_pcrel)
13201 {
13202 switch (fixp->fx_size)
13203 {
13204 default:
13205 as_bad_where (fixp->fx_file, fixp->fx_line,
13206 _("can not do %d byte pc-relative relocation"),
13207 fixp->fx_size);
13208 code = BFD_RELOC_32_PCREL;
13209 break;
13210 case 1: code = BFD_RELOC_8_PCREL; break;
13211 case 2: code = BFD_RELOC_16_PCREL; break;
13212 case 4: code = BFD_RELOC_32_PCREL; break;
13213 #ifdef BFD64
13214 case 8: code = BFD_RELOC_64_PCREL; break;
13215 #endif
13216 }
13217 }
13218 else
13219 {
13220 switch (fixp->fx_size)
13221 {
13222 default:
13223 as_bad_where (fixp->fx_file, fixp->fx_line,
13224 _("can not do %d byte relocation"),
13225 fixp->fx_size);
13226 code = BFD_RELOC_32;
13227 break;
13228 case 1: code = BFD_RELOC_8; break;
13229 case 2: code = BFD_RELOC_16; break;
13230 case 4: code = BFD_RELOC_32; break;
13231 #ifdef BFD64
13232 case 8: code = BFD_RELOC_64; break;
13233 #endif
13234 }
13235 }
13236 break;
13237 }
13238
13239 if ((code == BFD_RELOC_32
13240 || code == BFD_RELOC_32_PCREL
13241 || code == BFD_RELOC_X86_64_32S)
13242 && GOT_symbol
13243 && fixp->fx_addsy == GOT_symbol)
13244 {
13245 if (!object_64bit)
13246 code = BFD_RELOC_386_GOTPC;
13247 else
13248 code = BFD_RELOC_X86_64_GOTPC32;
13249 }
13250 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
13251 && GOT_symbol
13252 && fixp->fx_addsy == GOT_symbol)
13253 {
13254 code = BFD_RELOC_X86_64_GOTPC64;
13255 }
13256
13257 rel = XNEW (arelent);
13258 rel->sym_ptr_ptr = XNEW (asymbol *);
13259 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
13260
13261 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
13262
13263 if (!use_rela_relocations)
13264 {
13265 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
13266 vtable entry to be used in the relocation's section offset. */
13267 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
13268 rel->address = fixp->fx_offset;
13269 #if defined (OBJ_COFF) && defined (TE_PE)
13270 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
13271 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
13272 else
13273 #endif
13274 rel->addend = 0;
13275 }
13276 /* Use the rela in 64bit mode. */
13277 else
13278 {
13279 if (disallow_64bit_reloc)
13280 switch (code)
13281 {
13282 case BFD_RELOC_X86_64_DTPOFF64:
13283 case BFD_RELOC_X86_64_TPOFF64:
13284 case BFD_RELOC_64_PCREL:
13285 case BFD_RELOC_X86_64_GOTOFF64:
13286 case BFD_RELOC_X86_64_GOT64:
13287 case BFD_RELOC_X86_64_GOTPCREL64:
13288 case BFD_RELOC_X86_64_GOTPC64:
13289 case BFD_RELOC_X86_64_GOTPLT64:
13290 case BFD_RELOC_X86_64_PLTOFF64:
13291 as_bad_where (fixp->fx_file, fixp->fx_line,
13292 _("cannot represent relocation type %s in x32 mode"),
13293 bfd_get_reloc_code_name (code));
13294 break;
13295 default:
13296 break;
13297 }
13298
13299 if (!fixp->fx_pcrel)
13300 rel->addend = fixp->fx_offset;
13301 else
13302 switch (code)
13303 {
13304 case BFD_RELOC_X86_64_PLT32:
13305 case BFD_RELOC_X86_64_GOT32:
13306 case BFD_RELOC_X86_64_GOTPCREL:
13307 case BFD_RELOC_X86_64_GOTPCRELX:
13308 case BFD_RELOC_X86_64_REX_GOTPCRELX:
13309 case BFD_RELOC_X86_64_TLSGD:
13310 case BFD_RELOC_X86_64_TLSLD:
13311 case BFD_RELOC_X86_64_GOTTPOFF:
13312 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13313 case BFD_RELOC_X86_64_TLSDESC_CALL:
13314 rel->addend = fixp->fx_offset - fixp->fx_size;
13315 break;
13316 default:
13317 rel->addend = (section->vma
13318 - fixp->fx_size
13319 + fixp->fx_addnumber
13320 + md_pcrel_from (fixp));
13321 break;
13322 }
13323 }
13324
13325 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
13326 if (rel->howto == NULL)
13327 {
13328 as_bad_where (fixp->fx_file, fixp->fx_line,
13329 _("cannot represent relocation type %s"),
13330 bfd_get_reloc_code_name (code));
13331 /* Set howto to a garbage value so that we can keep going. */
13332 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
13333 gas_assert (rel->howto != NULL);
13334 }
13335
13336 return rel;
13337 }
13338
13339 #include "tc-i386-intel.c"
13340
13341 void
13342 tc_x86_parse_to_dw2regnum (expressionS *exp)
13343 {
13344 int saved_naked_reg;
13345 char saved_register_dot;
13346
13347 saved_naked_reg = allow_naked_reg;
13348 allow_naked_reg = 1;
13349 saved_register_dot = register_chars['.'];
13350 register_chars['.'] = '.';
13351 allow_pseudo_reg = 1;
13352 expression_and_evaluate (exp);
13353 allow_pseudo_reg = 0;
13354 register_chars['.'] = saved_register_dot;
13355 allow_naked_reg = saved_naked_reg;
13356
13357 if (exp->X_op == O_register && exp->X_add_number >= 0)
13358 {
13359 if ((addressT) exp->X_add_number < i386_regtab_size)
13360 {
13361 exp->X_op = O_constant;
13362 exp->X_add_number = i386_regtab[exp->X_add_number]
13363 .dw2_regnum[flag_code >> 1];
13364 }
13365 else
13366 exp->X_op = O_illegal;
13367 }
13368 }
13369
13370 void
13371 tc_x86_frame_initial_instructions (void)
13372 {
13373 static unsigned int sp_regno[2];
13374
13375 if (!sp_regno[flag_code >> 1])
13376 {
13377 char *saved_input = input_line_pointer;
13378 char sp[][4] = {"esp", "rsp"};
13379 expressionS exp;
13380
13381 input_line_pointer = sp[flag_code >> 1];
13382 tc_x86_parse_to_dw2regnum (&exp);
13383 gas_assert (exp.X_op == O_constant);
13384 sp_regno[flag_code >> 1] = exp.X_add_number;
13385 input_line_pointer = saved_input;
13386 }
13387
13388 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
13389 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
13390 }
13391
13392 int
13393 x86_dwarf2_addr_size (void)
13394 {
13395 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13396 if (x86_elf_abi == X86_64_X32_ABI)
13397 return 4;
13398 #endif
13399 return bfd_arch_bits_per_address (stdoutput) / 8;
13400 }
13401
13402 int
13403 i386_elf_section_type (const char *str, size_t len)
13404 {
13405 if (flag_code == CODE_64BIT
13406 && len == sizeof ("unwind") - 1
13407 && strncmp (str, "unwind", 6) == 0)
13408 return SHT_X86_64_UNWIND;
13409
13410 return -1;
13411 }
13412
13413 #ifdef TE_SOLARIS
13414 void
13415 i386_solaris_fix_up_eh_frame (segT sec)
13416 {
13417 if (flag_code == CODE_64BIT)
13418 elf_section_type (sec) = SHT_X86_64_UNWIND;
13419 }
13420 #endif
13421
13422 #ifdef TE_PE
13423 void
13424 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
13425 {
13426 expressionS exp;
13427
13428 exp.X_op = O_secrel;
13429 exp.X_add_symbol = symbol;
13430 exp.X_add_number = 0;
13431 emit_expr (&exp, size);
13432 }
13433 #endif
13434
13435 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13436 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
13437
13438 bfd_vma
13439 x86_64_section_letter (int letter, const char **ptr_msg)
13440 {
13441 if (flag_code == CODE_64BIT)
13442 {
13443 if (letter == 'l')
13444 return SHF_X86_64_LARGE;
13445
13446 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
13447 }
13448 else
13449 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
13450 return -1;
13451 }
13452
13453 bfd_vma
13454 x86_64_section_word (char *str, size_t len)
13455 {
13456 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
13457 return SHF_X86_64_LARGE;
13458
13459 return -1;
13460 }
13461
13462 static void
13463 handle_large_common (int small ATTRIBUTE_UNUSED)
13464 {
13465 if (flag_code != CODE_64BIT)
13466 {
13467 s_comm_internal (0, elf_common_parse);
13468 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
13469 }
13470 else
13471 {
13472 static segT lbss_section;
13473 asection *saved_com_section_ptr = elf_com_section_ptr;
13474 asection *saved_bss_section = bss_section;
13475
13476 if (lbss_section == NULL)
13477 {
13478 flagword applicable;
13479 segT seg = now_seg;
13480 subsegT subseg = now_subseg;
13481
13482 /* The .lbss section is for local .largecomm symbols. */
13483 lbss_section = subseg_new (".lbss", 0);
13484 applicable = bfd_applicable_section_flags (stdoutput);
13485 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
13486 seg_info (lbss_section)->bss = 1;
13487
13488 subseg_set (seg, subseg);
13489 }
13490
13491 elf_com_section_ptr = &_bfd_elf_large_com_section;
13492 bss_section = lbss_section;
13493
13494 s_comm_internal (0, elf_common_parse);
13495
13496 elf_com_section_ptr = saved_com_section_ptr;
13497 bss_section = saved_bss_section;
13498 }
13499 }
13500 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */