]> git.ipfire.org Git - thirdparty/binutils-gdb.git/blob - gas/config/tc-i386.c
i386: Only check suffix in instruction mnemonic
[thirdparty/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2019 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef REGISTER_WARNINGS
48 #define REGISTER_WARNINGS 1
49 #endif
50
51 #ifndef INFER_ADDR_PREFIX
52 #define INFER_ADDR_PREFIX 1
53 #endif
54
55 #ifndef DEFAULT_ARCH
56 #define DEFAULT_ARCH "i386"
57 #endif
58
59 #ifndef INLINE
60 #if __GNUC__ >= 2
61 #define INLINE __inline__
62 #else
63 #define INLINE
64 #endif
65 #endif
66
67 /* Prefixes will be emitted in the order defined below.
68 WAIT_PREFIX must be the first prefix since FWAIT is really is an
69 instruction, and so must come before any prefixes.
70 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
71 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
72 #define WAIT_PREFIX 0
73 #define SEG_PREFIX 1
74 #define ADDR_PREFIX 2
75 #define DATA_PREFIX 3
76 #define REP_PREFIX 4
77 #define HLE_PREFIX REP_PREFIX
78 #define BND_PREFIX REP_PREFIX
79 #define LOCK_PREFIX 5
80 #define REX_PREFIX 6 /* must come last. */
81 #define MAX_PREFIXES 7 /* max prefixes per opcode */
82
83 /* we define the syntax here (modulo base,index,scale syntax) */
84 #define REGISTER_PREFIX '%'
85 #define IMMEDIATE_PREFIX '$'
86 #define ABSOLUTE_PREFIX '*'
87
88 /* these are the instruction mnemonic suffixes in AT&T syntax or
89 memory operand size in Intel syntax. */
90 #define WORD_MNEM_SUFFIX 'w'
91 #define BYTE_MNEM_SUFFIX 'b'
92 #define SHORT_MNEM_SUFFIX 's'
93 #define LONG_MNEM_SUFFIX 'l'
94 #define QWORD_MNEM_SUFFIX 'q'
95 /* Intel Syntax. Use a non-ascii letter since since it never appears
96 in instructions. */
97 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
98
99 #define END_OF_INSN '\0'
100
101 /* This matches the C -> StaticRounding alias in the opcode table. */
102 #define commutative staticrounding
103
104 /*
105 'templates' is for grouping together 'template' structures for opcodes
106 of the same name. This is only used for storing the insns in the grand
107 ole hash table of insns.
108 The templates themselves start at START and range up to (but not including)
109 END.
110 */
111 typedef struct
112 {
113 const insn_template *start;
114 const insn_template *end;
115 }
116 templates;
117
118 /* 386 operand encoding bytes: see 386 book for details of this. */
119 typedef struct
120 {
121 unsigned int regmem; /* codes register or memory operand */
122 unsigned int reg; /* codes register operand (or extended opcode) */
123 unsigned int mode; /* how to interpret regmem & reg */
124 }
125 modrm_byte;
126
127 /* x86-64 extension prefix. */
128 typedef int rex_byte;
129
130 /* 386 opcode byte to code indirect addressing. */
131 typedef struct
132 {
133 unsigned base;
134 unsigned index;
135 unsigned scale;
136 }
137 sib_byte;
138
139 /* x86 arch names, types and features */
140 typedef struct
141 {
142 const char *name; /* arch name */
143 unsigned int len; /* arch string length */
144 enum processor_type type; /* arch type */
145 i386_cpu_flags flags; /* cpu feature flags */
146 unsigned int skip; /* show_arch should skip this. */
147 }
148 arch_entry;
149
150 /* Used to turn off indicated flags. */
151 typedef struct
152 {
153 const char *name; /* arch name */
154 unsigned int len; /* arch string length */
155 i386_cpu_flags flags; /* cpu feature flags */
156 }
157 noarch_entry;
158
159 static void update_code_flag (int, int);
160 static void set_code_flag (int);
161 static void set_16bit_gcc_code_flag (int);
162 static void set_intel_syntax (int);
163 static void set_intel_mnemonic (int);
164 static void set_allow_index_reg (int);
165 static void set_check (int);
166 static void set_cpu_arch (int);
167 #ifdef TE_PE
168 static void pe_directive_secrel (int);
169 #endif
170 static void signed_cons (int);
171 static char *output_invalid (int c);
172 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
173 const char *);
174 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
175 const char *);
176 static int i386_att_operand (char *);
177 static int i386_intel_operand (char *, int);
178 static int i386_intel_simplify (expressionS *);
179 static int i386_intel_parse_name (const char *, expressionS *);
180 static const reg_entry *parse_register (char *, char **);
181 static char *parse_insn (char *, char *);
182 static char *parse_operands (char *, const char *);
183 static void swap_operands (void);
184 static void swap_2_operands (int, int);
185 static void optimize_imm (void);
186 static void optimize_disp (void);
187 static const insn_template *match_template (char);
188 static int check_string (void);
189 static int process_suffix (void);
190 static int check_byte_reg (void);
191 static int check_long_reg (void);
192 static int check_qword_reg (void);
193 static int check_word_reg (void);
194 static int finalize_imm (void);
195 static int process_operands (void);
196 static const seg_entry *build_modrm_byte (void);
197 static void output_insn (void);
198 static void output_imm (fragS *, offsetT);
199 static void output_disp (fragS *, offsetT);
200 #ifndef I386COFF
201 static void s_bss (int);
202 #endif
203 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
204 static void handle_large_common (int small ATTRIBUTE_UNUSED);
205
206 /* GNU_PROPERTY_X86_ISA_1_USED. */
207 static unsigned int x86_isa_1_used;
208 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
209 static unsigned int x86_feature_2_used;
210 /* Generate x86 used ISA and feature properties. */
211 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
212 #endif
213
214 static const char *default_arch = DEFAULT_ARCH;
215
216 /* This struct describes rounding control and SAE in the instruction. */
217 struct RC_Operation
218 {
219 enum rc_type
220 {
221 rne = 0,
222 rd,
223 ru,
224 rz,
225 saeonly
226 } type;
227 int operand;
228 };
229
230 static struct RC_Operation rc_op;
231
232 /* The struct describes masking, applied to OPERAND in the instruction.
233 MASK is a pointer to the corresponding mask register. ZEROING tells
234 whether merging or zeroing mask is used. */
235 struct Mask_Operation
236 {
237 const reg_entry *mask;
238 unsigned int zeroing;
239 /* The operand where this operation is associated. */
240 int operand;
241 };
242
243 static struct Mask_Operation mask_op;
244
245 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
246 broadcast factor. */
247 struct Broadcast_Operation
248 {
249 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
250 int type;
251
252 /* Index of broadcasted operand. */
253 int operand;
254
255 /* Number of bytes to broadcast. */
256 int bytes;
257 };
258
259 static struct Broadcast_Operation broadcast_op;
260
261 /* VEX prefix. */
262 typedef struct
263 {
264 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
265 unsigned char bytes[4];
266 unsigned int length;
267 /* Destination or source register specifier. */
268 const reg_entry *register_specifier;
269 } vex_prefix;
270
271 /* 'md_assemble ()' gathers together information and puts it into a
272 i386_insn. */
273
274 union i386_op
275 {
276 expressionS *disps;
277 expressionS *imms;
278 const reg_entry *regs;
279 };
280
281 enum i386_error
282 {
283 operand_size_mismatch,
284 operand_type_mismatch,
285 register_type_mismatch,
286 number_of_operands_mismatch,
287 invalid_instruction_suffix,
288 bad_imm4,
289 unsupported_with_intel_mnemonic,
290 unsupported_syntax,
291 unsupported,
292 invalid_vsib_address,
293 invalid_vector_register_set,
294 unsupported_vector_index_register,
295 unsupported_broadcast,
296 broadcast_needed,
297 unsupported_masking,
298 mask_not_on_destination,
299 no_default_mask,
300 unsupported_rc_sae,
301 rc_sae_operand_not_last_imm,
302 invalid_register_operand,
303 };
304
305 struct _i386_insn
306 {
307 /* TM holds the template for the insn were currently assembling. */
308 insn_template tm;
309
310 /* SUFFIX holds the instruction size suffix for byte, word, dword
311 or qword, if given. */
312 char suffix;
313
314 /* OPERANDS gives the number of given operands. */
315 unsigned int operands;
316
317 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
318 of given register, displacement, memory operands and immediate
319 operands. */
320 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
321
322 /* TYPES [i] is the type (see above #defines) which tells us how to
323 use OP[i] for the corresponding operand. */
324 i386_operand_type types[MAX_OPERANDS];
325
326 /* Displacement expression, immediate expression, or register for each
327 operand. */
328 union i386_op op[MAX_OPERANDS];
329
330 /* Flags for operands. */
331 unsigned int flags[MAX_OPERANDS];
332 #define Operand_PCrel 1
333 #define Operand_Mem 2
334
335 /* Relocation type for operand */
336 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
337
338 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
339 the base index byte below. */
340 const reg_entry *base_reg;
341 const reg_entry *index_reg;
342 unsigned int log2_scale_factor;
343
344 /* SEG gives the seg_entries of this insn. They are zero unless
345 explicit segment overrides are given. */
346 const seg_entry *seg[2];
347
348 /* Copied first memory operand string, for re-checking. */
349 char *memop1_string;
350
351 /* PREFIX holds all the given prefix opcodes (usually null).
352 PREFIXES is the number of prefix opcodes. */
353 unsigned int prefixes;
354 unsigned char prefix[MAX_PREFIXES];
355
356 /* Has MMX register operands. */
357 bfd_boolean has_regmmx;
358
359 /* Has XMM register operands. */
360 bfd_boolean has_regxmm;
361
362 /* Has YMM register operands. */
363 bfd_boolean has_regymm;
364
365 /* Has ZMM register operands. */
366 bfd_boolean has_regzmm;
367
368 /* RM and SIB are the modrm byte and the sib byte where the
369 addressing modes of this insn are encoded. */
370 modrm_byte rm;
371 rex_byte rex;
372 rex_byte vrex;
373 sib_byte sib;
374 vex_prefix vex;
375
376 /* Masking attributes. */
377 struct Mask_Operation *mask;
378
379 /* Rounding control and SAE attributes. */
380 struct RC_Operation *rounding;
381
382 /* Broadcasting attributes. */
383 struct Broadcast_Operation *broadcast;
384
385 /* Compressed disp8*N attribute. */
386 unsigned int memshift;
387
388 /* Prefer load or store in encoding. */
389 enum
390 {
391 dir_encoding_default = 0,
392 dir_encoding_load,
393 dir_encoding_store,
394 dir_encoding_swap
395 } dir_encoding;
396
397 /* Prefer 8bit or 32bit displacement in encoding. */
398 enum
399 {
400 disp_encoding_default = 0,
401 disp_encoding_8bit,
402 disp_encoding_32bit
403 } disp_encoding;
404
405 /* Prefer the REX byte in encoding. */
406 bfd_boolean rex_encoding;
407
408 /* Disable instruction size optimization. */
409 bfd_boolean no_optimize;
410
411 /* How to encode vector instructions. */
412 enum
413 {
414 vex_encoding_default = 0,
415 vex_encoding_vex2,
416 vex_encoding_vex3,
417 vex_encoding_evex
418 } vec_encoding;
419
420 /* REP prefix. */
421 const char *rep_prefix;
422
423 /* HLE prefix. */
424 const char *hle_prefix;
425
426 /* Have BND prefix. */
427 const char *bnd_prefix;
428
429 /* Have NOTRACK prefix. */
430 const char *notrack_prefix;
431
432 /* Error message. */
433 enum i386_error error;
434 };
435
436 typedef struct _i386_insn i386_insn;
437
438 /* Link RC type with corresponding string, that'll be looked for in
439 asm. */
440 struct RC_name
441 {
442 enum rc_type type;
443 const char *name;
444 unsigned int len;
445 };
446
447 static const struct RC_name RC_NamesTable[] =
448 {
449 { rne, STRING_COMMA_LEN ("rn-sae") },
450 { rd, STRING_COMMA_LEN ("rd-sae") },
451 { ru, STRING_COMMA_LEN ("ru-sae") },
452 { rz, STRING_COMMA_LEN ("rz-sae") },
453 { saeonly, STRING_COMMA_LEN ("sae") },
454 };
455
456 /* List of chars besides those in app.c:symbol_chars that can start an
457 operand. Used to prevent the scrubber eating vital white-space. */
458 const char extra_symbol_chars[] = "*%-([{}"
459 #ifdef LEX_AT
460 "@"
461 #endif
462 #ifdef LEX_QM
463 "?"
464 #endif
465 ;
466
467 #if (defined (TE_I386AIX) \
468 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
469 && !defined (TE_GNU) \
470 && !defined (TE_LINUX) \
471 && !defined (TE_NACL) \
472 && !defined (TE_FreeBSD) \
473 && !defined (TE_DragonFly) \
474 && !defined (TE_NetBSD)))
475 /* This array holds the chars that always start a comment. If the
476 pre-processor is disabled, these aren't very useful. The option
477 --divide will remove '/' from this list. */
478 const char *i386_comment_chars = "#/";
479 #define SVR4_COMMENT_CHARS 1
480 #define PREFIX_SEPARATOR '\\'
481
482 #else
483 const char *i386_comment_chars = "#";
484 #define PREFIX_SEPARATOR '/'
485 #endif
486
487 /* This array holds the chars that only start a comment at the beginning of
488 a line. If the line seems to have the form '# 123 filename'
489 .line and .file directives will appear in the pre-processed output.
490 Note that input_file.c hand checks for '#' at the beginning of the
491 first line of the input file. This is because the compiler outputs
492 #NO_APP at the beginning of its output.
493 Also note that comments started like this one will always work if
494 '/' isn't otherwise defined. */
495 const char line_comment_chars[] = "#/";
496
497 const char line_separator_chars[] = ";";
498
499 /* Chars that can be used to separate mant from exp in floating point
500 nums. */
501 const char EXP_CHARS[] = "eE";
502
503 /* Chars that mean this number is a floating point constant
504 As in 0f12.456
505 or 0d1.2345e12. */
506 const char FLT_CHARS[] = "fFdDxX";
507
508 /* Tables for lexical analysis. */
509 static char mnemonic_chars[256];
510 static char register_chars[256];
511 static char operand_chars[256];
512 static char identifier_chars[256];
513 static char digit_chars[256];
514
515 /* Lexical macros. */
516 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
517 #define is_operand_char(x) (operand_chars[(unsigned char) x])
518 #define is_register_char(x) (register_chars[(unsigned char) x])
519 #define is_space_char(x) ((x) == ' ')
520 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
521 #define is_digit_char(x) (digit_chars[(unsigned char) x])
522
523 /* All non-digit non-letter characters that may occur in an operand. */
524 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
525
526 /* md_assemble() always leaves the strings it's passed unaltered. To
527 effect this we maintain a stack of saved characters that we've smashed
528 with '\0's (indicating end of strings for various sub-fields of the
529 assembler instruction). */
530 static char save_stack[32];
531 static char *save_stack_p;
532 #define END_STRING_AND_SAVE(s) \
533 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
534 #define RESTORE_END_STRING(s) \
535 do { *(s) = *--save_stack_p; } while (0)
536
537 /* The instruction we're assembling. */
538 static i386_insn i;
539
540 /* Possible templates for current insn. */
541 static const templates *current_templates;
542
543 /* Per instruction expressionS buffers: max displacements & immediates. */
544 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
545 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
546
547 /* Current operand we are working on. */
548 static int this_operand = -1;
549
550 /* We support four different modes. FLAG_CODE variable is used to distinguish
551 these. */
552
553 enum flag_code {
554 CODE_32BIT,
555 CODE_16BIT,
556 CODE_64BIT };
557
558 static enum flag_code flag_code;
559 static unsigned int object_64bit;
560 static unsigned int disallow_64bit_reloc;
561 static int use_rela_relocations = 0;
562
563 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
564 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
565 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
566
567 /* The ELF ABI to use. */
568 enum x86_elf_abi
569 {
570 I386_ABI,
571 X86_64_ABI,
572 X86_64_X32_ABI
573 };
574
575 static enum x86_elf_abi x86_elf_abi = I386_ABI;
576 #endif
577
578 #if defined (TE_PE) || defined (TE_PEP)
579 /* Use big object file format. */
580 static int use_big_obj = 0;
581 #endif
582
583 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
584 /* 1 if generating code for a shared library. */
585 static int shared = 0;
586 #endif
587
588 /* 1 for intel syntax,
589 0 if att syntax. */
590 static int intel_syntax = 0;
591
592 /* 1 for Intel64 ISA,
593 0 if AMD64 ISA. */
594 static int intel64;
595
596 /* 1 for intel mnemonic,
597 0 if att mnemonic. */
598 static int intel_mnemonic = !SYSV386_COMPAT;
599
600 /* 1 if pseudo registers are permitted. */
601 static int allow_pseudo_reg = 0;
602
603 /* 1 if register prefix % not required. */
604 static int allow_naked_reg = 0;
605
606 /* 1 if the assembler should add BND prefix for all control-transferring
607 instructions supporting it, even if this prefix wasn't specified
608 explicitly. */
609 static int add_bnd_prefix = 0;
610
611 /* 1 if pseudo index register, eiz/riz, is allowed . */
612 static int allow_index_reg = 0;
613
614 /* 1 if the assembler should ignore LOCK prefix, even if it was
615 specified explicitly. */
616 static int omit_lock_prefix = 0;
617
618 /* 1 if the assembler should encode lfence, mfence, and sfence as
619 "lock addl $0, (%{re}sp)". */
620 static int avoid_fence = 0;
621
622 /* 1 if the assembler should generate relax relocations. */
623
624 static int generate_relax_relocations
625 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
626
627 static enum check_kind
628 {
629 check_none = 0,
630 check_warning,
631 check_error
632 }
633 sse_check, operand_check = check_warning;
634
635 /* Optimization:
636 1. Clear the REX_W bit with register operand if possible.
637 2. Above plus use 128bit vector instruction to clear the full vector
638 register.
639 */
640 static int optimize = 0;
641
642 /* Optimization:
643 1. Clear the REX_W bit with register operand if possible.
644 2. Above plus use 128bit vector instruction to clear the full vector
645 register.
646 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
647 "testb $imm7,%r8".
648 */
649 static int optimize_for_space = 0;
650
651 /* Register prefix used for error message. */
652 static const char *register_prefix = "%";
653
654 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
655 leave, push, and pop instructions so that gcc has the same stack
656 frame as in 32 bit mode. */
657 static char stackop_size = '\0';
658
659 /* Non-zero to optimize code alignment. */
660 int optimize_align_code = 1;
661
662 /* Non-zero to quieten some warnings. */
663 static int quiet_warnings = 0;
664
665 /* CPU name. */
666 static const char *cpu_arch_name = NULL;
667 static char *cpu_sub_arch_name = NULL;
668
669 /* CPU feature flags. */
670 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
671
672 /* If we have selected a cpu we are generating instructions for. */
673 static int cpu_arch_tune_set = 0;
674
675 /* Cpu we are generating instructions for. */
676 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
677
678 /* CPU feature flags of cpu we are generating instructions for. */
679 static i386_cpu_flags cpu_arch_tune_flags;
680
681 /* CPU instruction set architecture used. */
682 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
683
684 /* CPU feature flags of instruction set architecture used. */
685 i386_cpu_flags cpu_arch_isa_flags;
686
687 /* If set, conditional jumps are not automatically promoted to handle
688 larger than a byte offset. */
689 static unsigned int no_cond_jump_promotion = 0;
690
691 /* Encode SSE instructions with VEX prefix. */
692 static unsigned int sse2avx;
693
694 /* Encode scalar AVX instructions with specific vector length. */
695 static enum
696 {
697 vex128 = 0,
698 vex256
699 } avxscalar;
700
701 /* Encode VEX WIG instructions with specific vex.w. */
702 static enum
703 {
704 vexw0 = 0,
705 vexw1
706 } vexwig;
707
708 /* Encode scalar EVEX LIG instructions with specific vector length. */
709 static enum
710 {
711 evexl128 = 0,
712 evexl256,
713 evexl512
714 } evexlig;
715
716 /* Encode EVEX WIG instructions with specific evex.w. */
717 static enum
718 {
719 evexw0 = 0,
720 evexw1
721 } evexwig;
722
723 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
724 static enum rc_type evexrcig = rne;
725
726 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
727 static symbolS *GOT_symbol;
728
729 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
730 unsigned int x86_dwarf2_return_column;
731
732 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
733 int x86_cie_data_alignment;
734
735 /* Interface to relax_segment.
736 There are 3 major relax states for 386 jump insns because the
737 different types of jumps add different sizes to frags when we're
738 figuring out what sort of jump to choose to reach a given label. */
739
740 /* Types. */
741 #define UNCOND_JUMP 0
742 #define COND_JUMP 1
743 #define COND_JUMP86 2
744
745 /* Sizes. */
746 #define CODE16 1
747 #define SMALL 0
748 #define SMALL16 (SMALL | CODE16)
749 #define BIG 2
750 #define BIG16 (BIG | CODE16)
751
752 #ifndef INLINE
753 #ifdef __GNUC__
754 #define INLINE __inline__
755 #else
756 #define INLINE
757 #endif
758 #endif
759
760 #define ENCODE_RELAX_STATE(type, size) \
761 ((relax_substateT) (((type) << 2) | (size)))
762 #define TYPE_FROM_RELAX_STATE(s) \
763 ((s) >> 2)
764 #define DISP_SIZE_FROM_RELAX_STATE(s) \
765 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
766
767 /* This table is used by relax_frag to promote short jumps to long
768 ones where necessary. SMALL (short) jumps may be promoted to BIG
769 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
770 don't allow a short jump in a 32 bit code segment to be promoted to
771 a 16 bit offset jump because it's slower (requires data size
772 prefix), and doesn't work, unless the destination is in the bottom
773 64k of the code segment (The top 16 bits of eip are zeroed). */
774
775 const relax_typeS md_relax_table[] =
776 {
777 /* The fields are:
778 1) most positive reach of this state,
779 2) most negative reach of this state,
780 3) how many bytes this mode will have in the variable part of the frag
781 4) which index into the table to try if we can't fit into this one. */
782
783 /* UNCOND_JUMP states. */
784 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
785 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
786 /* dword jmp adds 4 bytes to frag:
787 0 extra opcode bytes, 4 displacement bytes. */
788 {0, 0, 4, 0},
789 /* word jmp adds 2 byte2 to frag:
790 0 extra opcode bytes, 2 displacement bytes. */
791 {0, 0, 2, 0},
792
793 /* COND_JUMP states. */
794 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
795 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
796 /* dword conditionals adds 5 bytes to frag:
797 1 extra opcode byte, 4 displacement bytes. */
798 {0, 0, 5, 0},
799 /* word conditionals add 3 bytes to frag:
800 1 extra opcode byte, 2 displacement bytes. */
801 {0, 0, 3, 0},
802
803 /* COND_JUMP86 states. */
804 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
805 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
806 /* dword conditionals adds 5 bytes to frag:
807 1 extra opcode byte, 4 displacement bytes. */
808 {0, 0, 5, 0},
809 /* word conditionals add 4 bytes to frag:
810 1 displacement byte and a 3 byte long branch insn. */
811 {0, 0, 4, 0}
812 };
813
814 static const arch_entry cpu_arch[] =
815 {
816 /* Do not replace the first two entries - i386_target_format()
817 relies on them being there in this order. */
818 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
819 CPU_GENERIC32_FLAGS, 0 },
820 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
821 CPU_GENERIC64_FLAGS, 0 },
822 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
823 CPU_NONE_FLAGS, 0 },
824 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
825 CPU_I186_FLAGS, 0 },
826 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
827 CPU_I286_FLAGS, 0 },
828 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
829 CPU_I386_FLAGS, 0 },
830 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
831 CPU_I486_FLAGS, 0 },
832 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
833 CPU_I586_FLAGS, 0 },
834 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
835 CPU_I686_FLAGS, 0 },
836 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
837 CPU_I586_FLAGS, 0 },
838 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
839 CPU_PENTIUMPRO_FLAGS, 0 },
840 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
841 CPU_P2_FLAGS, 0 },
842 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
843 CPU_P3_FLAGS, 0 },
844 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
845 CPU_P4_FLAGS, 0 },
846 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
847 CPU_CORE_FLAGS, 0 },
848 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
849 CPU_NOCONA_FLAGS, 0 },
850 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
851 CPU_CORE_FLAGS, 1 },
852 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
853 CPU_CORE_FLAGS, 0 },
854 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
855 CPU_CORE2_FLAGS, 1 },
856 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
857 CPU_CORE2_FLAGS, 0 },
858 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
859 CPU_COREI7_FLAGS, 0 },
860 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
861 CPU_L1OM_FLAGS, 0 },
862 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
863 CPU_K1OM_FLAGS, 0 },
864 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
865 CPU_IAMCU_FLAGS, 0 },
866 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
867 CPU_K6_FLAGS, 0 },
868 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
869 CPU_K6_2_FLAGS, 0 },
870 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
871 CPU_ATHLON_FLAGS, 0 },
872 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
873 CPU_K8_FLAGS, 1 },
874 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
875 CPU_K8_FLAGS, 0 },
876 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
877 CPU_K8_FLAGS, 0 },
878 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
879 CPU_AMDFAM10_FLAGS, 0 },
880 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
881 CPU_BDVER1_FLAGS, 0 },
882 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
883 CPU_BDVER2_FLAGS, 0 },
884 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
885 CPU_BDVER3_FLAGS, 0 },
886 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
887 CPU_BDVER4_FLAGS, 0 },
888 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
889 CPU_ZNVER1_FLAGS, 0 },
890 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
891 CPU_ZNVER2_FLAGS, 0 },
892 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
893 CPU_BTVER1_FLAGS, 0 },
894 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
895 CPU_BTVER2_FLAGS, 0 },
896 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
897 CPU_8087_FLAGS, 0 },
898 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
899 CPU_287_FLAGS, 0 },
900 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
901 CPU_387_FLAGS, 0 },
902 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
903 CPU_687_FLAGS, 0 },
904 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
905 CPU_CMOV_FLAGS, 0 },
906 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
907 CPU_FXSR_FLAGS, 0 },
908 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
909 CPU_MMX_FLAGS, 0 },
910 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
911 CPU_SSE_FLAGS, 0 },
912 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
913 CPU_SSE2_FLAGS, 0 },
914 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
915 CPU_SSE3_FLAGS, 0 },
916 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
917 CPU_SSSE3_FLAGS, 0 },
918 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
919 CPU_SSE4_1_FLAGS, 0 },
920 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
921 CPU_SSE4_2_FLAGS, 0 },
922 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
923 CPU_SSE4_2_FLAGS, 0 },
924 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
925 CPU_AVX_FLAGS, 0 },
926 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
927 CPU_AVX2_FLAGS, 0 },
928 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
929 CPU_AVX512F_FLAGS, 0 },
930 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
931 CPU_AVX512CD_FLAGS, 0 },
932 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
933 CPU_AVX512ER_FLAGS, 0 },
934 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
935 CPU_AVX512PF_FLAGS, 0 },
936 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
937 CPU_AVX512DQ_FLAGS, 0 },
938 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
939 CPU_AVX512BW_FLAGS, 0 },
940 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
941 CPU_AVX512VL_FLAGS, 0 },
942 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
943 CPU_VMX_FLAGS, 0 },
944 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
945 CPU_VMFUNC_FLAGS, 0 },
946 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
947 CPU_SMX_FLAGS, 0 },
948 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
949 CPU_XSAVE_FLAGS, 0 },
950 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
951 CPU_XSAVEOPT_FLAGS, 0 },
952 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
953 CPU_XSAVEC_FLAGS, 0 },
954 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
955 CPU_XSAVES_FLAGS, 0 },
956 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
957 CPU_AES_FLAGS, 0 },
958 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
959 CPU_PCLMUL_FLAGS, 0 },
960 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
961 CPU_PCLMUL_FLAGS, 1 },
962 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
963 CPU_FSGSBASE_FLAGS, 0 },
964 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
965 CPU_RDRND_FLAGS, 0 },
966 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
967 CPU_F16C_FLAGS, 0 },
968 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
969 CPU_BMI2_FLAGS, 0 },
970 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
971 CPU_FMA_FLAGS, 0 },
972 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
973 CPU_FMA4_FLAGS, 0 },
974 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
975 CPU_XOP_FLAGS, 0 },
976 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
977 CPU_LWP_FLAGS, 0 },
978 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
979 CPU_MOVBE_FLAGS, 0 },
980 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
981 CPU_CX16_FLAGS, 0 },
982 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
983 CPU_EPT_FLAGS, 0 },
984 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
985 CPU_LZCNT_FLAGS, 0 },
986 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
987 CPU_HLE_FLAGS, 0 },
988 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
989 CPU_RTM_FLAGS, 0 },
990 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
991 CPU_INVPCID_FLAGS, 0 },
992 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
993 CPU_CLFLUSH_FLAGS, 0 },
994 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
995 CPU_NOP_FLAGS, 0 },
996 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
997 CPU_SYSCALL_FLAGS, 0 },
998 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
999 CPU_RDTSCP_FLAGS, 0 },
1000 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1001 CPU_3DNOW_FLAGS, 0 },
1002 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1003 CPU_3DNOWA_FLAGS, 0 },
1004 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1005 CPU_PADLOCK_FLAGS, 0 },
1006 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1007 CPU_SVME_FLAGS, 1 },
1008 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1009 CPU_SVME_FLAGS, 0 },
1010 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1011 CPU_SSE4A_FLAGS, 0 },
1012 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1013 CPU_ABM_FLAGS, 0 },
1014 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1015 CPU_BMI_FLAGS, 0 },
1016 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1017 CPU_TBM_FLAGS, 0 },
1018 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1019 CPU_ADX_FLAGS, 0 },
1020 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1021 CPU_RDSEED_FLAGS, 0 },
1022 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1023 CPU_PRFCHW_FLAGS, 0 },
1024 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1025 CPU_SMAP_FLAGS, 0 },
1026 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1027 CPU_MPX_FLAGS, 0 },
1028 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1029 CPU_SHA_FLAGS, 0 },
1030 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1031 CPU_CLFLUSHOPT_FLAGS, 0 },
1032 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1033 CPU_PREFETCHWT1_FLAGS, 0 },
1034 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1035 CPU_SE1_FLAGS, 0 },
1036 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1037 CPU_CLWB_FLAGS, 0 },
1038 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1039 CPU_AVX512IFMA_FLAGS, 0 },
1040 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1041 CPU_AVX512VBMI_FLAGS, 0 },
1042 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1043 CPU_AVX512_4FMAPS_FLAGS, 0 },
1044 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1045 CPU_AVX512_4VNNIW_FLAGS, 0 },
1046 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1047 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1048 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1049 CPU_AVX512_VBMI2_FLAGS, 0 },
1050 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1051 CPU_AVX512_VNNI_FLAGS, 0 },
1052 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1053 CPU_AVX512_BITALG_FLAGS, 0 },
1054 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1055 CPU_CLZERO_FLAGS, 0 },
1056 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1057 CPU_MWAITX_FLAGS, 0 },
1058 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1059 CPU_OSPKE_FLAGS, 0 },
1060 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1061 CPU_RDPID_FLAGS, 0 },
1062 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1063 CPU_PTWRITE_FLAGS, 0 },
1064 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1065 CPU_IBT_FLAGS, 0 },
1066 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1067 CPU_SHSTK_FLAGS, 0 },
1068 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1069 CPU_GFNI_FLAGS, 0 },
1070 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1071 CPU_VAES_FLAGS, 0 },
1072 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1073 CPU_VPCLMULQDQ_FLAGS, 0 },
1074 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1075 CPU_WBNOINVD_FLAGS, 0 },
1076 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1077 CPU_PCONFIG_FLAGS, 0 },
1078 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1079 CPU_WAITPKG_FLAGS, 0 },
1080 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1081 CPU_CLDEMOTE_FLAGS, 0 },
1082 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1083 CPU_MOVDIRI_FLAGS, 0 },
1084 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1085 CPU_MOVDIR64B_FLAGS, 0 },
1086 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1087 CPU_AVX512_BF16_FLAGS, 0 },
1088 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1089 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1090 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1091 CPU_ENQCMD_FLAGS, 0 },
1092 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1093 CPU_RDPRU_FLAGS, 0 },
1094 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1095 CPU_MCOMMIT_FLAGS, 0 },
1096 };
1097
1098 static const noarch_entry cpu_noarch[] =
1099 {
1100 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1101 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1102 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1103 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1104 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1105 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1106 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1107 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1108 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1109 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1110 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1111 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1112 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1113 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1114 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1115 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1116 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1117 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1118 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1119 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1120 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1121 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1122 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1123 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1124 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1125 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1126 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1127 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1128 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1129 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1130 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1131 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1132 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1133 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1134 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1135 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1136 { STRING_COMMA_LEN ("noavx512_vp2intersect"), CPU_ANY_SHSTK_FLAGS },
1137 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1138 };
1139
1140 #ifdef I386COFF
1141 /* Like s_lcomm_internal in gas/read.c but the alignment string
1142 is allowed to be optional. */
1143
1144 static symbolS *
1145 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1146 {
1147 addressT align = 0;
1148
1149 SKIP_WHITESPACE ();
1150
1151 if (needs_align
1152 && *input_line_pointer == ',')
1153 {
1154 align = parse_align (needs_align - 1);
1155
1156 if (align == (addressT) -1)
1157 return NULL;
1158 }
1159 else
1160 {
1161 if (size >= 8)
1162 align = 3;
1163 else if (size >= 4)
1164 align = 2;
1165 else if (size >= 2)
1166 align = 1;
1167 else
1168 align = 0;
1169 }
1170
1171 bss_alloc (symbolP, size, align);
1172 return symbolP;
1173 }
1174
1175 static void
1176 pe_lcomm (int needs_align)
1177 {
1178 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1179 }
1180 #endif
1181
1182 const pseudo_typeS md_pseudo_table[] =
1183 {
1184 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1185 {"align", s_align_bytes, 0},
1186 #else
1187 {"align", s_align_ptwo, 0},
1188 #endif
1189 {"arch", set_cpu_arch, 0},
1190 #ifndef I386COFF
1191 {"bss", s_bss, 0},
1192 #else
1193 {"lcomm", pe_lcomm, 1},
1194 #endif
1195 {"ffloat", float_cons, 'f'},
1196 {"dfloat", float_cons, 'd'},
1197 {"tfloat", float_cons, 'x'},
1198 {"value", cons, 2},
1199 {"slong", signed_cons, 4},
1200 {"noopt", s_ignore, 0},
1201 {"optim", s_ignore, 0},
1202 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1203 {"code16", set_code_flag, CODE_16BIT},
1204 {"code32", set_code_flag, CODE_32BIT},
1205 #ifdef BFD64
1206 {"code64", set_code_flag, CODE_64BIT},
1207 #endif
1208 {"intel_syntax", set_intel_syntax, 1},
1209 {"att_syntax", set_intel_syntax, 0},
1210 {"intel_mnemonic", set_intel_mnemonic, 1},
1211 {"att_mnemonic", set_intel_mnemonic, 0},
1212 {"allow_index_reg", set_allow_index_reg, 1},
1213 {"disallow_index_reg", set_allow_index_reg, 0},
1214 {"sse_check", set_check, 0},
1215 {"operand_check", set_check, 1},
1216 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1217 {"largecomm", handle_large_common, 0},
1218 #else
1219 {"file", dwarf2_directive_file, 0},
1220 {"loc", dwarf2_directive_loc, 0},
1221 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1222 #endif
1223 #ifdef TE_PE
1224 {"secrel32", pe_directive_secrel, 0},
1225 #endif
1226 {0, 0, 0}
1227 };
1228
1229 /* For interface with expression (). */
1230 extern char *input_line_pointer;
1231
1232 /* Hash table for instruction mnemonic lookup. */
1233 static struct hash_control *op_hash;
1234
1235 /* Hash table for register lookup. */
1236 static struct hash_control *reg_hash;
1237 \f
1238 /* Various efficient no-op patterns for aligning code labels.
1239 Note: Don't try to assemble the instructions in the comments.
1240 0L and 0w are not legal. */
1241 static const unsigned char f32_1[] =
1242 {0x90}; /* nop */
1243 static const unsigned char f32_2[] =
1244 {0x66,0x90}; /* xchg %ax,%ax */
1245 static const unsigned char f32_3[] =
1246 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1247 static const unsigned char f32_4[] =
1248 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1249 static const unsigned char f32_6[] =
1250 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1251 static const unsigned char f32_7[] =
1252 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1253 static const unsigned char f16_3[] =
1254 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1255 static const unsigned char f16_4[] =
1256 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1257 static const unsigned char jump_disp8[] =
1258 {0xeb}; /* jmp disp8 */
1259 static const unsigned char jump32_disp32[] =
1260 {0xe9}; /* jmp disp32 */
1261 static const unsigned char jump16_disp32[] =
1262 {0x66,0xe9}; /* jmp disp32 */
1263 /* 32-bit NOPs patterns. */
1264 static const unsigned char *const f32_patt[] = {
1265 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1266 };
1267 /* 16-bit NOPs patterns. */
1268 static const unsigned char *const f16_patt[] = {
1269 f32_1, f32_2, f16_3, f16_4
1270 };
1271 /* nopl (%[re]ax) */
1272 static const unsigned char alt_3[] =
1273 {0x0f,0x1f,0x00};
1274 /* nopl 0(%[re]ax) */
1275 static const unsigned char alt_4[] =
1276 {0x0f,0x1f,0x40,0x00};
1277 /* nopl 0(%[re]ax,%[re]ax,1) */
1278 static const unsigned char alt_5[] =
1279 {0x0f,0x1f,0x44,0x00,0x00};
1280 /* nopw 0(%[re]ax,%[re]ax,1) */
1281 static const unsigned char alt_6[] =
1282 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1283 /* nopl 0L(%[re]ax) */
1284 static const unsigned char alt_7[] =
1285 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1286 /* nopl 0L(%[re]ax,%[re]ax,1) */
1287 static const unsigned char alt_8[] =
1288 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1289 /* nopw 0L(%[re]ax,%[re]ax,1) */
1290 static const unsigned char alt_9[] =
1291 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1292 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1293 static const unsigned char alt_10[] =
1294 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1295 /* data16 nopw %cs:0L(%eax,%eax,1) */
1296 static const unsigned char alt_11[] =
1297 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1298 /* 32-bit and 64-bit NOPs patterns. */
1299 static const unsigned char *const alt_patt[] = {
1300 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1301 alt_9, alt_10, alt_11
1302 };
1303
1304 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1305 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1306
1307 static void
1308 i386_output_nops (char *where, const unsigned char *const *patt,
1309 int count, int max_single_nop_size)
1310
1311 {
1312 /* Place the longer NOP first. */
1313 int last;
1314 int offset;
1315 const unsigned char *nops;
1316
1317 if (max_single_nop_size < 1)
1318 {
1319 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1320 max_single_nop_size);
1321 return;
1322 }
1323
1324 nops = patt[max_single_nop_size - 1];
1325
1326 /* Use the smaller one if the requsted one isn't available. */
1327 if (nops == NULL)
1328 {
1329 max_single_nop_size--;
1330 nops = patt[max_single_nop_size - 1];
1331 }
1332
1333 last = count % max_single_nop_size;
1334
1335 count -= last;
1336 for (offset = 0; offset < count; offset += max_single_nop_size)
1337 memcpy (where + offset, nops, max_single_nop_size);
1338
1339 if (last)
1340 {
1341 nops = patt[last - 1];
1342 if (nops == NULL)
1343 {
1344 /* Use the smaller one plus one-byte NOP if the needed one
1345 isn't available. */
1346 last--;
1347 nops = patt[last - 1];
1348 memcpy (where + offset, nops, last);
1349 where[offset + last] = *patt[0];
1350 }
1351 else
1352 memcpy (where + offset, nops, last);
1353 }
1354 }
1355
1356 static INLINE int
1357 fits_in_imm7 (offsetT num)
1358 {
1359 return (num & 0x7f) == num;
1360 }
1361
1362 static INLINE int
1363 fits_in_imm31 (offsetT num)
1364 {
1365 return (num & 0x7fffffff) == num;
1366 }
1367
1368 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1369 single NOP instruction LIMIT. */
1370
1371 void
1372 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1373 {
1374 const unsigned char *const *patt = NULL;
1375 int max_single_nop_size;
1376 /* Maximum number of NOPs before switching to jump over NOPs. */
1377 int max_number_of_nops;
1378
1379 switch (fragP->fr_type)
1380 {
1381 case rs_fill_nop:
1382 case rs_align_code:
1383 break;
1384 default:
1385 return;
1386 }
1387
1388 /* We need to decide which NOP sequence to use for 32bit and
1389 64bit. When -mtune= is used:
1390
1391 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1392 PROCESSOR_GENERIC32, f32_patt will be used.
1393 2. For the rest, alt_patt will be used.
1394
1395 When -mtune= isn't used, alt_patt will be used if
1396 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1397 be used.
1398
1399 When -march= or .arch is used, we can't use anything beyond
1400 cpu_arch_isa_flags. */
1401
1402 if (flag_code == CODE_16BIT)
1403 {
1404 patt = f16_patt;
1405 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1406 /* Limit number of NOPs to 2 in 16-bit mode. */
1407 max_number_of_nops = 2;
1408 }
1409 else
1410 {
1411 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1412 {
1413 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1414 switch (cpu_arch_tune)
1415 {
1416 case PROCESSOR_UNKNOWN:
1417 /* We use cpu_arch_isa_flags to check if we SHOULD
1418 optimize with nops. */
1419 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1420 patt = alt_patt;
1421 else
1422 patt = f32_patt;
1423 break;
1424 case PROCESSOR_PENTIUM4:
1425 case PROCESSOR_NOCONA:
1426 case PROCESSOR_CORE:
1427 case PROCESSOR_CORE2:
1428 case PROCESSOR_COREI7:
1429 case PROCESSOR_L1OM:
1430 case PROCESSOR_K1OM:
1431 case PROCESSOR_GENERIC64:
1432 case PROCESSOR_K6:
1433 case PROCESSOR_ATHLON:
1434 case PROCESSOR_K8:
1435 case PROCESSOR_AMDFAM10:
1436 case PROCESSOR_BD:
1437 case PROCESSOR_ZNVER:
1438 case PROCESSOR_BT:
1439 patt = alt_patt;
1440 break;
1441 case PROCESSOR_I386:
1442 case PROCESSOR_I486:
1443 case PROCESSOR_PENTIUM:
1444 case PROCESSOR_PENTIUMPRO:
1445 case PROCESSOR_IAMCU:
1446 case PROCESSOR_GENERIC32:
1447 patt = f32_patt;
1448 break;
1449 }
1450 }
1451 else
1452 {
1453 switch (fragP->tc_frag_data.tune)
1454 {
1455 case PROCESSOR_UNKNOWN:
1456 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1457 PROCESSOR_UNKNOWN. */
1458 abort ();
1459 break;
1460
1461 case PROCESSOR_I386:
1462 case PROCESSOR_I486:
1463 case PROCESSOR_PENTIUM:
1464 case PROCESSOR_IAMCU:
1465 case PROCESSOR_K6:
1466 case PROCESSOR_ATHLON:
1467 case PROCESSOR_K8:
1468 case PROCESSOR_AMDFAM10:
1469 case PROCESSOR_BD:
1470 case PROCESSOR_ZNVER:
1471 case PROCESSOR_BT:
1472 case PROCESSOR_GENERIC32:
1473 /* We use cpu_arch_isa_flags to check if we CAN optimize
1474 with nops. */
1475 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1476 patt = alt_patt;
1477 else
1478 patt = f32_patt;
1479 break;
1480 case PROCESSOR_PENTIUMPRO:
1481 case PROCESSOR_PENTIUM4:
1482 case PROCESSOR_NOCONA:
1483 case PROCESSOR_CORE:
1484 case PROCESSOR_CORE2:
1485 case PROCESSOR_COREI7:
1486 case PROCESSOR_L1OM:
1487 case PROCESSOR_K1OM:
1488 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1489 patt = alt_patt;
1490 else
1491 patt = f32_patt;
1492 break;
1493 case PROCESSOR_GENERIC64:
1494 patt = alt_patt;
1495 break;
1496 }
1497 }
1498
1499 if (patt == f32_patt)
1500 {
1501 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1502 /* Limit number of NOPs to 2 for older processors. */
1503 max_number_of_nops = 2;
1504 }
1505 else
1506 {
1507 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1508 /* Limit number of NOPs to 7 for newer processors. */
1509 max_number_of_nops = 7;
1510 }
1511 }
1512
1513 if (limit == 0)
1514 limit = max_single_nop_size;
1515
1516 if (fragP->fr_type == rs_fill_nop)
1517 {
1518 /* Output NOPs for .nop directive. */
1519 if (limit > max_single_nop_size)
1520 {
1521 as_bad_where (fragP->fr_file, fragP->fr_line,
1522 _("invalid single nop size: %d "
1523 "(expect within [0, %d])"),
1524 limit, max_single_nop_size);
1525 return;
1526 }
1527 }
1528 else
1529 fragP->fr_var = count;
1530
1531 if ((count / max_single_nop_size) > max_number_of_nops)
1532 {
1533 /* Generate jump over NOPs. */
1534 offsetT disp = count - 2;
1535 if (fits_in_imm7 (disp))
1536 {
1537 /* Use "jmp disp8" if possible. */
1538 count = disp;
1539 where[0] = jump_disp8[0];
1540 where[1] = count;
1541 where += 2;
1542 }
1543 else
1544 {
1545 unsigned int size_of_jump;
1546
1547 if (flag_code == CODE_16BIT)
1548 {
1549 where[0] = jump16_disp32[0];
1550 where[1] = jump16_disp32[1];
1551 size_of_jump = 2;
1552 }
1553 else
1554 {
1555 where[0] = jump32_disp32[0];
1556 size_of_jump = 1;
1557 }
1558
1559 count -= size_of_jump + 4;
1560 if (!fits_in_imm31 (count))
1561 {
1562 as_bad_where (fragP->fr_file, fragP->fr_line,
1563 _("jump over nop padding out of range"));
1564 return;
1565 }
1566
1567 md_number_to_chars (where + size_of_jump, count, 4);
1568 where += size_of_jump + 4;
1569 }
1570 }
1571
1572 /* Generate multiple NOPs. */
1573 i386_output_nops (where, patt, count, limit);
1574 }
1575
1576 static INLINE int
1577 operand_type_all_zero (const union i386_operand_type *x)
1578 {
1579 switch (ARRAY_SIZE(x->array))
1580 {
1581 case 3:
1582 if (x->array[2])
1583 return 0;
1584 /* Fall through. */
1585 case 2:
1586 if (x->array[1])
1587 return 0;
1588 /* Fall through. */
1589 case 1:
1590 return !x->array[0];
1591 default:
1592 abort ();
1593 }
1594 }
1595
1596 static INLINE void
1597 operand_type_set (union i386_operand_type *x, unsigned int v)
1598 {
1599 switch (ARRAY_SIZE(x->array))
1600 {
1601 case 3:
1602 x->array[2] = v;
1603 /* Fall through. */
1604 case 2:
1605 x->array[1] = v;
1606 /* Fall through. */
1607 case 1:
1608 x->array[0] = v;
1609 /* Fall through. */
1610 break;
1611 default:
1612 abort ();
1613 }
1614
1615 x->bitfield.class = ClassNone;
1616 }
1617
1618 static INLINE int
1619 operand_type_equal (const union i386_operand_type *x,
1620 const union i386_operand_type *y)
1621 {
1622 switch (ARRAY_SIZE(x->array))
1623 {
1624 case 3:
1625 if (x->array[2] != y->array[2])
1626 return 0;
1627 /* Fall through. */
1628 case 2:
1629 if (x->array[1] != y->array[1])
1630 return 0;
1631 /* Fall through. */
1632 case 1:
1633 return x->array[0] == y->array[0];
1634 break;
1635 default:
1636 abort ();
1637 }
1638 }
1639
1640 static INLINE int
1641 cpu_flags_all_zero (const union i386_cpu_flags *x)
1642 {
1643 switch (ARRAY_SIZE(x->array))
1644 {
1645 case 4:
1646 if (x->array[3])
1647 return 0;
1648 /* Fall through. */
1649 case 3:
1650 if (x->array[2])
1651 return 0;
1652 /* Fall through. */
1653 case 2:
1654 if (x->array[1])
1655 return 0;
1656 /* Fall through. */
1657 case 1:
1658 return !x->array[0];
1659 default:
1660 abort ();
1661 }
1662 }
1663
1664 static INLINE int
1665 cpu_flags_equal (const union i386_cpu_flags *x,
1666 const union i386_cpu_flags *y)
1667 {
1668 switch (ARRAY_SIZE(x->array))
1669 {
1670 case 4:
1671 if (x->array[3] != y->array[3])
1672 return 0;
1673 /* Fall through. */
1674 case 3:
1675 if (x->array[2] != y->array[2])
1676 return 0;
1677 /* Fall through. */
1678 case 2:
1679 if (x->array[1] != y->array[1])
1680 return 0;
1681 /* Fall through. */
1682 case 1:
1683 return x->array[0] == y->array[0];
1684 break;
1685 default:
1686 abort ();
1687 }
1688 }
1689
1690 static INLINE int
1691 cpu_flags_check_cpu64 (i386_cpu_flags f)
1692 {
1693 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1694 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1695 }
1696
1697 static INLINE i386_cpu_flags
1698 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1699 {
1700 switch (ARRAY_SIZE (x.array))
1701 {
1702 case 4:
1703 x.array [3] &= y.array [3];
1704 /* Fall through. */
1705 case 3:
1706 x.array [2] &= y.array [2];
1707 /* Fall through. */
1708 case 2:
1709 x.array [1] &= y.array [1];
1710 /* Fall through. */
1711 case 1:
1712 x.array [0] &= y.array [0];
1713 break;
1714 default:
1715 abort ();
1716 }
1717 return x;
1718 }
1719
1720 static INLINE i386_cpu_flags
1721 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1722 {
1723 switch (ARRAY_SIZE (x.array))
1724 {
1725 case 4:
1726 x.array [3] |= y.array [3];
1727 /* Fall through. */
1728 case 3:
1729 x.array [2] |= y.array [2];
1730 /* Fall through. */
1731 case 2:
1732 x.array [1] |= y.array [1];
1733 /* Fall through. */
1734 case 1:
1735 x.array [0] |= y.array [0];
1736 break;
1737 default:
1738 abort ();
1739 }
1740 return x;
1741 }
1742
1743 static INLINE i386_cpu_flags
1744 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1745 {
1746 switch (ARRAY_SIZE (x.array))
1747 {
1748 case 4:
1749 x.array [3] &= ~y.array [3];
1750 /* Fall through. */
1751 case 3:
1752 x.array [2] &= ~y.array [2];
1753 /* Fall through. */
1754 case 2:
1755 x.array [1] &= ~y.array [1];
1756 /* Fall through. */
1757 case 1:
1758 x.array [0] &= ~y.array [0];
1759 break;
1760 default:
1761 abort ();
1762 }
1763 return x;
1764 }
1765
1766 #define CPU_FLAGS_ARCH_MATCH 0x1
1767 #define CPU_FLAGS_64BIT_MATCH 0x2
1768
1769 #define CPU_FLAGS_PERFECT_MATCH \
1770 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1771
1772 /* Return CPU flags match bits. */
1773
1774 static int
1775 cpu_flags_match (const insn_template *t)
1776 {
1777 i386_cpu_flags x = t->cpu_flags;
1778 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1779
1780 x.bitfield.cpu64 = 0;
1781 x.bitfield.cpuno64 = 0;
1782
1783 if (cpu_flags_all_zero (&x))
1784 {
1785 /* This instruction is available on all archs. */
1786 match |= CPU_FLAGS_ARCH_MATCH;
1787 }
1788 else
1789 {
1790 /* This instruction is available only on some archs. */
1791 i386_cpu_flags cpu = cpu_arch_flags;
1792
1793 /* AVX512VL is no standalone feature - match it and then strip it. */
1794 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1795 return match;
1796 x.bitfield.cpuavx512vl = 0;
1797
1798 cpu = cpu_flags_and (x, cpu);
1799 if (!cpu_flags_all_zero (&cpu))
1800 {
1801 if (x.bitfield.cpuavx)
1802 {
1803 /* We need to check a few extra flags with AVX. */
1804 if (cpu.bitfield.cpuavx
1805 && (!t->opcode_modifier.sse2avx || sse2avx)
1806 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1807 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1808 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1809 match |= CPU_FLAGS_ARCH_MATCH;
1810 }
1811 else if (x.bitfield.cpuavx512f)
1812 {
1813 /* We need to check a few extra flags with AVX512F. */
1814 if (cpu.bitfield.cpuavx512f
1815 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1816 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1817 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1818 match |= CPU_FLAGS_ARCH_MATCH;
1819 }
1820 else
1821 match |= CPU_FLAGS_ARCH_MATCH;
1822 }
1823 }
1824 return match;
1825 }
1826
1827 static INLINE i386_operand_type
1828 operand_type_and (i386_operand_type x, i386_operand_type y)
1829 {
1830 if (x.bitfield.class != y.bitfield.class)
1831 x.bitfield.class = ClassNone;
1832
1833 switch (ARRAY_SIZE (x.array))
1834 {
1835 case 3:
1836 x.array [2] &= y.array [2];
1837 /* Fall through. */
1838 case 2:
1839 x.array [1] &= y.array [1];
1840 /* Fall through. */
1841 case 1:
1842 x.array [0] &= y.array [0];
1843 break;
1844 default:
1845 abort ();
1846 }
1847 return x;
1848 }
1849
1850 static INLINE i386_operand_type
1851 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1852 {
1853 gas_assert (y.bitfield.class == ClassNone);
1854
1855 switch (ARRAY_SIZE (x.array))
1856 {
1857 case 3:
1858 x.array [2] &= ~y.array [2];
1859 /* Fall through. */
1860 case 2:
1861 x.array [1] &= ~y.array [1];
1862 /* Fall through. */
1863 case 1:
1864 x.array [0] &= ~y.array [0];
1865 break;
1866 default:
1867 abort ();
1868 }
1869 return x;
1870 }
1871
1872 static INLINE i386_operand_type
1873 operand_type_or (i386_operand_type x, i386_operand_type y)
1874 {
1875 gas_assert (x.bitfield.class == ClassNone ||
1876 y.bitfield.class == ClassNone ||
1877 x.bitfield.class == y.bitfield.class);
1878
1879 switch (ARRAY_SIZE (x.array))
1880 {
1881 case 3:
1882 x.array [2] |= y.array [2];
1883 /* Fall through. */
1884 case 2:
1885 x.array [1] |= y.array [1];
1886 /* Fall through. */
1887 case 1:
1888 x.array [0] |= y.array [0];
1889 break;
1890 default:
1891 abort ();
1892 }
1893 return x;
1894 }
1895
1896 static INLINE i386_operand_type
1897 operand_type_xor (i386_operand_type x, i386_operand_type y)
1898 {
1899 gas_assert (y.bitfield.class == ClassNone);
1900
1901 switch (ARRAY_SIZE (x.array))
1902 {
1903 case 3:
1904 x.array [2] ^= y.array [2];
1905 /* Fall through. */
1906 case 2:
1907 x.array [1] ^= y.array [1];
1908 /* Fall through. */
1909 case 1:
1910 x.array [0] ^= y.array [0];
1911 break;
1912 default:
1913 abort ();
1914 }
1915 return x;
1916 }
1917
1918 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1919 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1920 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1921 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1922 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
1923 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
1924 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1925 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1926 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1927 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1928 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1929 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1930 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1931 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1932 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1933 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1934 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1935
1936 enum operand_type
1937 {
1938 reg,
1939 imm,
1940 disp,
1941 anymem
1942 };
1943
1944 static INLINE int
1945 operand_type_check (i386_operand_type t, enum operand_type c)
1946 {
1947 switch (c)
1948 {
1949 case reg:
1950 return t.bitfield.class == Reg;
1951
1952 case imm:
1953 return (t.bitfield.imm8
1954 || t.bitfield.imm8s
1955 || t.bitfield.imm16
1956 || t.bitfield.imm32
1957 || t.bitfield.imm32s
1958 || t.bitfield.imm64);
1959
1960 case disp:
1961 return (t.bitfield.disp8
1962 || t.bitfield.disp16
1963 || t.bitfield.disp32
1964 || t.bitfield.disp32s
1965 || t.bitfield.disp64);
1966
1967 case anymem:
1968 return (t.bitfield.disp8
1969 || t.bitfield.disp16
1970 || t.bitfield.disp32
1971 || t.bitfield.disp32s
1972 || t.bitfield.disp64
1973 || t.bitfield.baseindex);
1974
1975 default:
1976 abort ();
1977 }
1978
1979 return 0;
1980 }
1981
1982 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
1983 between operand GIVEN and opeand WANTED for instruction template T. */
1984
1985 static INLINE int
1986 match_operand_size (const insn_template *t, unsigned int wanted,
1987 unsigned int given)
1988 {
1989 return !((i.types[given].bitfield.byte
1990 && !t->operand_types[wanted].bitfield.byte)
1991 || (i.types[given].bitfield.word
1992 && !t->operand_types[wanted].bitfield.word)
1993 || (i.types[given].bitfield.dword
1994 && !t->operand_types[wanted].bitfield.dword)
1995 || (i.types[given].bitfield.qword
1996 && !t->operand_types[wanted].bitfield.qword)
1997 || (i.types[given].bitfield.tbyte
1998 && !t->operand_types[wanted].bitfield.tbyte));
1999 }
2000
2001 /* Return 1 if there is no conflict in SIMD register between operand
2002 GIVEN and opeand WANTED for instruction template T. */
2003
2004 static INLINE int
2005 match_simd_size (const insn_template *t, unsigned int wanted,
2006 unsigned int given)
2007 {
2008 return !((i.types[given].bitfield.xmmword
2009 && !t->operand_types[wanted].bitfield.xmmword)
2010 || (i.types[given].bitfield.ymmword
2011 && !t->operand_types[wanted].bitfield.ymmword)
2012 || (i.types[given].bitfield.zmmword
2013 && !t->operand_types[wanted].bitfield.zmmword));
2014 }
2015
2016 /* Return 1 if there is no conflict in any size between operand GIVEN
2017 and opeand WANTED for instruction template T. */
2018
2019 static INLINE int
2020 match_mem_size (const insn_template *t, unsigned int wanted,
2021 unsigned int given)
2022 {
2023 return (match_operand_size (t, wanted, given)
2024 && !((i.types[given].bitfield.unspecified
2025 && !i.broadcast
2026 && !t->operand_types[wanted].bitfield.unspecified)
2027 || (i.types[given].bitfield.fword
2028 && !t->operand_types[wanted].bitfield.fword)
2029 /* For scalar opcode templates to allow register and memory
2030 operands at the same time, some special casing is needed
2031 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2032 down-conversion vpmov*. */
2033 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2034 && !t->opcode_modifier.broadcast
2035 && (t->operand_types[wanted].bitfield.byte
2036 || t->operand_types[wanted].bitfield.word
2037 || t->operand_types[wanted].bitfield.dword
2038 || t->operand_types[wanted].bitfield.qword))
2039 ? (i.types[given].bitfield.xmmword
2040 || i.types[given].bitfield.ymmword
2041 || i.types[given].bitfield.zmmword)
2042 : !match_simd_size(t, wanted, given))));
2043 }
2044
2045 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2046 operands for instruction template T, and it has MATCH_REVERSE set if there
2047 is no size conflict on any operands for the template with operands reversed
2048 (and the template allows for reversing in the first place). */
2049
2050 #define MATCH_STRAIGHT 1
2051 #define MATCH_REVERSE 2
2052
2053 static INLINE unsigned int
2054 operand_size_match (const insn_template *t)
2055 {
2056 unsigned int j, match = MATCH_STRAIGHT;
2057
2058 /* Don't check jump instructions. */
2059 if (t->opcode_modifier.jump
2060 || t->opcode_modifier.jumpbyte
2061 || t->opcode_modifier.jumpdword
2062 || t->opcode_modifier.jumpintersegment)
2063 return match;
2064
2065 /* Check memory and accumulator operand size. */
2066 for (j = 0; j < i.operands; j++)
2067 {
2068 if (i.types[j].bitfield.class != Reg
2069 && i.types[j].bitfield.class != RegSIMD
2070 && t->operand_types[j].bitfield.anysize)
2071 continue;
2072
2073 if (t->operand_types[j].bitfield.class == Reg
2074 && !match_operand_size (t, j, j))
2075 {
2076 match = 0;
2077 break;
2078 }
2079
2080 if (t->operand_types[j].bitfield.class == RegSIMD
2081 && !match_simd_size (t, j, j))
2082 {
2083 match = 0;
2084 break;
2085 }
2086
2087 if (t->operand_types[j].bitfield.acc
2088 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2089 {
2090 match = 0;
2091 break;
2092 }
2093
2094 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2095 {
2096 match = 0;
2097 break;
2098 }
2099 }
2100
2101 if (!t->opcode_modifier.d)
2102 {
2103 mismatch:
2104 if (!match)
2105 i.error = operand_size_mismatch;
2106 return match;
2107 }
2108
2109 /* Check reverse. */
2110 gas_assert (i.operands >= 2 && i.operands <= 3);
2111
2112 for (j = 0; j < i.operands; j++)
2113 {
2114 unsigned int given = i.operands - j - 1;
2115
2116 if (t->operand_types[j].bitfield.class == Reg
2117 && !match_operand_size (t, j, given))
2118 goto mismatch;
2119
2120 if (t->operand_types[j].bitfield.class == RegSIMD
2121 && !match_simd_size (t, j, given))
2122 goto mismatch;
2123
2124 if (t->operand_types[j].bitfield.acc
2125 && (!match_operand_size (t, j, given)
2126 || !match_simd_size (t, j, given)))
2127 goto mismatch;
2128
2129 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2130 goto mismatch;
2131 }
2132
2133 return match | MATCH_REVERSE;
2134 }
2135
2136 static INLINE int
2137 operand_type_match (i386_operand_type overlap,
2138 i386_operand_type given)
2139 {
2140 i386_operand_type temp = overlap;
2141
2142 temp.bitfield.jumpabsolute = 0;
2143 temp.bitfield.unspecified = 0;
2144 temp.bitfield.byte = 0;
2145 temp.bitfield.word = 0;
2146 temp.bitfield.dword = 0;
2147 temp.bitfield.fword = 0;
2148 temp.bitfield.qword = 0;
2149 temp.bitfield.tbyte = 0;
2150 temp.bitfield.xmmword = 0;
2151 temp.bitfield.ymmword = 0;
2152 temp.bitfield.zmmword = 0;
2153 if (operand_type_all_zero (&temp))
2154 goto mismatch;
2155
2156 if (given.bitfield.baseindex == overlap.bitfield.baseindex
2157 && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
2158 return 1;
2159
2160 mismatch:
2161 i.error = operand_type_mismatch;
2162 return 0;
2163 }
2164
2165 /* If given types g0 and g1 are registers they must be of the same type
2166 unless the expected operand type register overlap is null.
2167 Memory operand size of certain SIMD instructions is also being checked
2168 here. */
2169
2170 static INLINE int
2171 operand_type_register_match (i386_operand_type g0,
2172 i386_operand_type t0,
2173 i386_operand_type g1,
2174 i386_operand_type t1)
2175 {
2176 if (g0.bitfield.class != Reg
2177 && g0.bitfield.class != RegSIMD
2178 && (!operand_type_check (g0, anymem)
2179 || g0.bitfield.unspecified
2180 || t0.bitfield.class != RegSIMD))
2181 return 1;
2182
2183 if (g1.bitfield.class != Reg
2184 && g1.bitfield.class != RegSIMD
2185 && (!operand_type_check (g1, anymem)
2186 || g1.bitfield.unspecified
2187 || t1.bitfield.class != RegSIMD))
2188 return 1;
2189
2190 if (g0.bitfield.byte == g1.bitfield.byte
2191 && g0.bitfield.word == g1.bitfield.word
2192 && g0.bitfield.dword == g1.bitfield.dword
2193 && g0.bitfield.qword == g1.bitfield.qword
2194 && g0.bitfield.xmmword == g1.bitfield.xmmword
2195 && g0.bitfield.ymmword == g1.bitfield.ymmword
2196 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2197 return 1;
2198
2199 if (!(t0.bitfield.byte & t1.bitfield.byte)
2200 && !(t0.bitfield.word & t1.bitfield.word)
2201 && !(t0.bitfield.dword & t1.bitfield.dword)
2202 && !(t0.bitfield.qword & t1.bitfield.qword)
2203 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2204 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2205 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2206 return 1;
2207
2208 i.error = register_type_mismatch;
2209
2210 return 0;
2211 }
2212
2213 static INLINE unsigned int
2214 register_number (const reg_entry *r)
2215 {
2216 unsigned int nr = r->reg_num;
2217
2218 if (r->reg_flags & RegRex)
2219 nr += 8;
2220
2221 if (r->reg_flags & RegVRex)
2222 nr += 16;
2223
2224 return nr;
2225 }
2226
2227 static INLINE unsigned int
2228 mode_from_disp_size (i386_operand_type t)
2229 {
2230 if (t.bitfield.disp8)
2231 return 1;
2232 else if (t.bitfield.disp16
2233 || t.bitfield.disp32
2234 || t.bitfield.disp32s)
2235 return 2;
2236 else
2237 return 0;
2238 }
2239
2240 static INLINE int
2241 fits_in_signed_byte (addressT num)
2242 {
2243 return num + 0x80 <= 0xff;
2244 }
2245
2246 static INLINE int
2247 fits_in_unsigned_byte (addressT num)
2248 {
2249 return num <= 0xff;
2250 }
2251
2252 static INLINE int
2253 fits_in_unsigned_word (addressT num)
2254 {
2255 return num <= 0xffff;
2256 }
2257
2258 static INLINE int
2259 fits_in_signed_word (addressT num)
2260 {
2261 return num + 0x8000 <= 0xffff;
2262 }
2263
2264 static INLINE int
2265 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2266 {
2267 #ifndef BFD64
2268 return 1;
2269 #else
2270 return num + 0x80000000 <= 0xffffffff;
2271 #endif
2272 } /* fits_in_signed_long() */
2273
2274 static INLINE int
2275 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2276 {
2277 #ifndef BFD64
2278 return 1;
2279 #else
2280 return num <= 0xffffffff;
2281 #endif
2282 } /* fits_in_unsigned_long() */
2283
2284 static INLINE int
2285 fits_in_disp8 (offsetT num)
2286 {
2287 int shift = i.memshift;
2288 unsigned int mask;
2289
2290 if (shift == -1)
2291 abort ();
2292
2293 mask = (1 << shift) - 1;
2294
2295 /* Return 0 if NUM isn't properly aligned. */
2296 if ((num & mask))
2297 return 0;
2298
2299 /* Check if NUM will fit in 8bit after shift. */
2300 return fits_in_signed_byte (num >> shift);
2301 }
2302
2303 static INLINE int
2304 fits_in_imm4 (offsetT num)
2305 {
2306 return (num & 0xf) == num;
2307 }
2308
2309 static i386_operand_type
2310 smallest_imm_type (offsetT num)
2311 {
2312 i386_operand_type t;
2313
2314 operand_type_set (&t, 0);
2315 t.bitfield.imm64 = 1;
2316
2317 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2318 {
2319 /* This code is disabled on the 486 because all the Imm1 forms
2320 in the opcode table are slower on the i486. They're the
2321 versions with the implicitly specified single-position
2322 displacement, which has another syntax if you really want to
2323 use that form. */
2324 t.bitfield.imm1 = 1;
2325 t.bitfield.imm8 = 1;
2326 t.bitfield.imm8s = 1;
2327 t.bitfield.imm16 = 1;
2328 t.bitfield.imm32 = 1;
2329 t.bitfield.imm32s = 1;
2330 }
2331 else if (fits_in_signed_byte (num))
2332 {
2333 t.bitfield.imm8 = 1;
2334 t.bitfield.imm8s = 1;
2335 t.bitfield.imm16 = 1;
2336 t.bitfield.imm32 = 1;
2337 t.bitfield.imm32s = 1;
2338 }
2339 else if (fits_in_unsigned_byte (num))
2340 {
2341 t.bitfield.imm8 = 1;
2342 t.bitfield.imm16 = 1;
2343 t.bitfield.imm32 = 1;
2344 t.bitfield.imm32s = 1;
2345 }
2346 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2347 {
2348 t.bitfield.imm16 = 1;
2349 t.bitfield.imm32 = 1;
2350 t.bitfield.imm32s = 1;
2351 }
2352 else if (fits_in_signed_long (num))
2353 {
2354 t.bitfield.imm32 = 1;
2355 t.bitfield.imm32s = 1;
2356 }
2357 else if (fits_in_unsigned_long (num))
2358 t.bitfield.imm32 = 1;
2359
2360 return t;
2361 }
2362
2363 static offsetT
2364 offset_in_range (offsetT val, int size)
2365 {
2366 addressT mask;
2367
2368 switch (size)
2369 {
2370 case 1: mask = ((addressT) 1 << 8) - 1; break;
2371 case 2: mask = ((addressT) 1 << 16) - 1; break;
2372 case 4: mask = ((addressT) 2 << 31) - 1; break;
2373 #ifdef BFD64
2374 case 8: mask = ((addressT) 2 << 63) - 1; break;
2375 #endif
2376 default: abort ();
2377 }
2378
2379 #ifdef BFD64
2380 /* If BFD64, sign extend val for 32bit address mode. */
2381 if (flag_code != CODE_64BIT
2382 || i.prefix[ADDR_PREFIX])
2383 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2384 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2385 #endif
2386
2387 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2388 {
2389 char buf1[40], buf2[40];
2390
2391 sprint_value (buf1, val);
2392 sprint_value (buf2, val & mask);
2393 as_warn (_("%s shortened to %s"), buf1, buf2);
2394 }
2395 return val & mask;
2396 }
2397
2398 enum PREFIX_GROUP
2399 {
2400 PREFIX_EXIST = 0,
2401 PREFIX_LOCK,
2402 PREFIX_REP,
2403 PREFIX_DS,
2404 PREFIX_OTHER
2405 };
2406
2407 /* Returns
2408 a. PREFIX_EXIST if attempting to add a prefix where one from the
2409 same class already exists.
2410 b. PREFIX_LOCK if lock prefix is added.
2411 c. PREFIX_REP if rep/repne prefix is added.
2412 d. PREFIX_DS if ds prefix is added.
2413 e. PREFIX_OTHER if other prefix is added.
2414 */
2415
2416 static enum PREFIX_GROUP
2417 add_prefix (unsigned int prefix)
2418 {
2419 enum PREFIX_GROUP ret = PREFIX_OTHER;
2420 unsigned int q;
2421
2422 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2423 && flag_code == CODE_64BIT)
2424 {
2425 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2426 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2427 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2428 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2429 ret = PREFIX_EXIST;
2430 q = REX_PREFIX;
2431 }
2432 else
2433 {
2434 switch (prefix)
2435 {
2436 default:
2437 abort ();
2438
2439 case DS_PREFIX_OPCODE:
2440 ret = PREFIX_DS;
2441 /* Fall through. */
2442 case CS_PREFIX_OPCODE:
2443 case ES_PREFIX_OPCODE:
2444 case FS_PREFIX_OPCODE:
2445 case GS_PREFIX_OPCODE:
2446 case SS_PREFIX_OPCODE:
2447 q = SEG_PREFIX;
2448 break;
2449
2450 case REPNE_PREFIX_OPCODE:
2451 case REPE_PREFIX_OPCODE:
2452 q = REP_PREFIX;
2453 ret = PREFIX_REP;
2454 break;
2455
2456 case LOCK_PREFIX_OPCODE:
2457 q = LOCK_PREFIX;
2458 ret = PREFIX_LOCK;
2459 break;
2460
2461 case FWAIT_OPCODE:
2462 q = WAIT_PREFIX;
2463 break;
2464
2465 case ADDR_PREFIX_OPCODE:
2466 q = ADDR_PREFIX;
2467 break;
2468
2469 case DATA_PREFIX_OPCODE:
2470 q = DATA_PREFIX;
2471 break;
2472 }
2473 if (i.prefix[q] != 0)
2474 ret = PREFIX_EXIST;
2475 }
2476
2477 if (ret)
2478 {
2479 if (!i.prefix[q])
2480 ++i.prefixes;
2481 i.prefix[q] |= prefix;
2482 }
2483 else
2484 as_bad (_("same type of prefix used twice"));
2485
2486 return ret;
2487 }
2488
2489 static void
2490 update_code_flag (int value, int check)
2491 {
2492 PRINTF_LIKE ((*as_error));
2493
2494 flag_code = (enum flag_code) value;
2495 if (flag_code == CODE_64BIT)
2496 {
2497 cpu_arch_flags.bitfield.cpu64 = 1;
2498 cpu_arch_flags.bitfield.cpuno64 = 0;
2499 }
2500 else
2501 {
2502 cpu_arch_flags.bitfield.cpu64 = 0;
2503 cpu_arch_flags.bitfield.cpuno64 = 1;
2504 }
2505 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2506 {
2507 if (check)
2508 as_error = as_fatal;
2509 else
2510 as_error = as_bad;
2511 (*as_error) (_("64bit mode not supported on `%s'."),
2512 cpu_arch_name ? cpu_arch_name : default_arch);
2513 }
2514 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2515 {
2516 if (check)
2517 as_error = as_fatal;
2518 else
2519 as_error = as_bad;
2520 (*as_error) (_("32bit mode not supported on `%s'."),
2521 cpu_arch_name ? cpu_arch_name : default_arch);
2522 }
2523 stackop_size = '\0';
2524 }
2525
2526 static void
2527 set_code_flag (int value)
2528 {
2529 update_code_flag (value, 0);
2530 }
2531
2532 static void
2533 set_16bit_gcc_code_flag (int new_code_flag)
2534 {
2535 flag_code = (enum flag_code) new_code_flag;
2536 if (flag_code != CODE_16BIT)
2537 abort ();
2538 cpu_arch_flags.bitfield.cpu64 = 0;
2539 cpu_arch_flags.bitfield.cpuno64 = 1;
2540 stackop_size = LONG_MNEM_SUFFIX;
2541 }
2542
2543 static void
2544 set_intel_syntax (int syntax_flag)
2545 {
2546 /* Find out if register prefixing is specified. */
2547 int ask_naked_reg = 0;
2548
2549 SKIP_WHITESPACE ();
2550 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2551 {
2552 char *string;
2553 int e = get_symbol_name (&string);
2554
2555 if (strcmp (string, "prefix") == 0)
2556 ask_naked_reg = 1;
2557 else if (strcmp (string, "noprefix") == 0)
2558 ask_naked_reg = -1;
2559 else
2560 as_bad (_("bad argument to syntax directive."));
2561 (void) restore_line_pointer (e);
2562 }
2563 demand_empty_rest_of_line ();
2564
2565 intel_syntax = syntax_flag;
2566
2567 if (ask_naked_reg == 0)
2568 allow_naked_reg = (intel_syntax
2569 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2570 else
2571 allow_naked_reg = (ask_naked_reg < 0);
2572
2573 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2574
2575 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2576 identifier_chars['$'] = intel_syntax ? '$' : 0;
2577 register_prefix = allow_naked_reg ? "" : "%";
2578 }
2579
2580 static void
2581 set_intel_mnemonic (int mnemonic_flag)
2582 {
2583 intel_mnemonic = mnemonic_flag;
2584 }
2585
2586 static void
2587 set_allow_index_reg (int flag)
2588 {
2589 allow_index_reg = flag;
2590 }
2591
2592 static void
2593 set_check (int what)
2594 {
2595 enum check_kind *kind;
2596 const char *str;
2597
2598 if (what)
2599 {
2600 kind = &operand_check;
2601 str = "operand";
2602 }
2603 else
2604 {
2605 kind = &sse_check;
2606 str = "sse";
2607 }
2608
2609 SKIP_WHITESPACE ();
2610
2611 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2612 {
2613 char *string;
2614 int e = get_symbol_name (&string);
2615
2616 if (strcmp (string, "none") == 0)
2617 *kind = check_none;
2618 else if (strcmp (string, "warning") == 0)
2619 *kind = check_warning;
2620 else if (strcmp (string, "error") == 0)
2621 *kind = check_error;
2622 else
2623 as_bad (_("bad argument to %s_check directive."), str);
2624 (void) restore_line_pointer (e);
2625 }
2626 else
2627 as_bad (_("missing argument for %s_check directive"), str);
2628
2629 demand_empty_rest_of_line ();
2630 }
2631
2632 static void
2633 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2634 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2635 {
2636 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2637 static const char *arch;
2638
2639 /* Intel LIOM is only supported on ELF. */
2640 if (!IS_ELF)
2641 return;
2642
2643 if (!arch)
2644 {
2645 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2646 use default_arch. */
2647 arch = cpu_arch_name;
2648 if (!arch)
2649 arch = default_arch;
2650 }
2651
2652 /* If we are targeting Intel MCU, we must enable it. */
2653 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2654 || new_flag.bitfield.cpuiamcu)
2655 return;
2656
2657 /* If we are targeting Intel L1OM, we must enable it. */
2658 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2659 || new_flag.bitfield.cpul1om)
2660 return;
2661
2662 /* If we are targeting Intel K1OM, we must enable it. */
2663 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2664 || new_flag.bitfield.cpuk1om)
2665 return;
2666
2667 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2668 #endif
2669 }
2670
2671 static void
2672 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2673 {
2674 SKIP_WHITESPACE ();
2675
2676 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2677 {
2678 char *string;
2679 int e = get_symbol_name (&string);
2680 unsigned int j;
2681 i386_cpu_flags flags;
2682
2683 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2684 {
2685 if (strcmp (string, cpu_arch[j].name) == 0)
2686 {
2687 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2688
2689 if (*string != '.')
2690 {
2691 cpu_arch_name = cpu_arch[j].name;
2692 cpu_sub_arch_name = NULL;
2693 cpu_arch_flags = cpu_arch[j].flags;
2694 if (flag_code == CODE_64BIT)
2695 {
2696 cpu_arch_flags.bitfield.cpu64 = 1;
2697 cpu_arch_flags.bitfield.cpuno64 = 0;
2698 }
2699 else
2700 {
2701 cpu_arch_flags.bitfield.cpu64 = 0;
2702 cpu_arch_flags.bitfield.cpuno64 = 1;
2703 }
2704 cpu_arch_isa = cpu_arch[j].type;
2705 cpu_arch_isa_flags = cpu_arch[j].flags;
2706 if (!cpu_arch_tune_set)
2707 {
2708 cpu_arch_tune = cpu_arch_isa;
2709 cpu_arch_tune_flags = cpu_arch_isa_flags;
2710 }
2711 break;
2712 }
2713
2714 flags = cpu_flags_or (cpu_arch_flags,
2715 cpu_arch[j].flags);
2716
2717 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2718 {
2719 if (cpu_sub_arch_name)
2720 {
2721 char *name = cpu_sub_arch_name;
2722 cpu_sub_arch_name = concat (name,
2723 cpu_arch[j].name,
2724 (const char *) NULL);
2725 free (name);
2726 }
2727 else
2728 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2729 cpu_arch_flags = flags;
2730 cpu_arch_isa_flags = flags;
2731 }
2732 else
2733 cpu_arch_isa_flags
2734 = cpu_flags_or (cpu_arch_isa_flags,
2735 cpu_arch[j].flags);
2736 (void) restore_line_pointer (e);
2737 demand_empty_rest_of_line ();
2738 return;
2739 }
2740 }
2741
2742 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2743 {
2744 /* Disable an ISA extension. */
2745 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2746 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2747 {
2748 flags = cpu_flags_and_not (cpu_arch_flags,
2749 cpu_noarch[j].flags);
2750 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2751 {
2752 if (cpu_sub_arch_name)
2753 {
2754 char *name = cpu_sub_arch_name;
2755 cpu_sub_arch_name = concat (name, string,
2756 (const char *) NULL);
2757 free (name);
2758 }
2759 else
2760 cpu_sub_arch_name = xstrdup (string);
2761 cpu_arch_flags = flags;
2762 cpu_arch_isa_flags = flags;
2763 }
2764 (void) restore_line_pointer (e);
2765 demand_empty_rest_of_line ();
2766 return;
2767 }
2768
2769 j = ARRAY_SIZE (cpu_arch);
2770 }
2771
2772 if (j >= ARRAY_SIZE (cpu_arch))
2773 as_bad (_("no such architecture: `%s'"), string);
2774
2775 *input_line_pointer = e;
2776 }
2777 else
2778 as_bad (_("missing cpu architecture"));
2779
2780 no_cond_jump_promotion = 0;
2781 if (*input_line_pointer == ','
2782 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2783 {
2784 char *string;
2785 char e;
2786
2787 ++input_line_pointer;
2788 e = get_symbol_name (&string);
2789
2790 if (strcmp (string, "nojumps") == 0)
2791 no_cond_jump_promotion = 1;
2792 else if (strcmp (string, "jumps") == 0)
2793 ;
2794 else
2795 as_bad (_("no such architecture modifier: `%s'"), string);
2796
2797 (void) restore_line_pointer (e);
2798 }
2799
2800 demand_empty_rest_of_line ();
2801 }
2802
2803 enum bfd_architecture
2804 i386_arch (void)
2805 {
2806 if (cpu_arch_isa == PROCESSOR_L1OM)
2807 {
2808 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2809 || flag_code != CODE_64BIT)
2810 as_fatal (_("Intel L1OM is 64bit ELF only"));
2811 return bfd_arch_l1om;
2812 }
2813 else if (cpu_arch_isa == PROCESSOR_K1OM)
2814 {
2815 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2816 || flag_code != CODE_64BIT)
2817 as_fatal (_("Intel K1OM is 64bit ELF only"));
2818 return bfd_arch_k1om;
2819 }
2820 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2821 {
2822 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2823 || flag_code == CODE_64BIT)
2824 as_fatal (_("Intel MCU is 32bit ELF only"));
2825 return bfd_arch_iamcu;
2826 }
2827 else
2828 return bfd_arch_i386;
2829 }
2830
2831 unsigned long
2832 i386_mach (void)
2833 {
2834 if (!strncmp (default_arch, "x86_64", 6))
2835 {
2836 if (cpu_arch_isa == PROCESSOR_L1OM)
2837 {
2838 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2839 || default_arch[6] != '\0')
2840 as_fatal (_("Intel L1OM is 64bit ELF only"));
2841 return bfd_mach_l1om;
2842 }
2843 else if (cpu_arch_isa == PROCESSOR_K1OM)
2844 {
2845 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2846 || default_arch[6] != '\0')
2847 as_fatal (_("Intel K1OM is 64bit ELF only"));
2848 return bfd_mach_k1om;
2849 }
2850 else if (default_arch[6] == '\0')
2851 return bfd_mach_x86_64;
2852 else
2853 return bfd_mach_x64_32;
2854 }
2855 else if (!strcmp (default_arch, "i386")
2856 || !strcmp (default_arch, "iamcu"))
2857 {
2858 if (cpu_arch_isa == PROCESSOR_IAMCU)
2859 {
2860 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2861 as_fatal (_("Intel MCU is 32bit ELF only"));
2862 return bfd_mach_i386_iamcu;
2863 }
2864 else
2865 return bfd_mach_i386_i386;
2866 }
2867 else
2868 as_fatal (_("unknown architecture"));
2869 }
2870 \f
2871 void
2872 md_begin (void)
2873 {
2874 const char *hash_err;
2875
2876 /* Support pseudo prefixes like {disp32}. */
2877 lex_type ['{'] = LEX_BEGIN_NAME;
2878
2879 /* Initialize op_hash hash table. */
2880 op_hash = hash_new ();
2881
2882 {
2883 const insn_template *optab;
2884 templates *core_optab;
2885
2886 /* Setup for loop. */
2887 optab = i386_optab;
2888 core_optab = XNEW (templates);
2889 core_optab->start = optab;
2890
2891 while (1)
2892 {
2893 ++optab;
2894 if (optab->name == NULL
2895 || strcmp (optab->name, (optab - 1)->name) != 0)
2896 {
2897 /* different name --> ship out current template list;
2898 add to hash table; & begin anew. */
2899 core_optab->end = optab;
2900 hash_err = hash_insert (op_hash,
2901 (optab - 1)->name,
2902 (void *) core_optab);
2903 if (hash_err)
2904 {
2905 as_fatal (_("can't hash %s: %s"),
2906 (optab - 1)->name,
2907 hash_err);
2908 }
2909 if (optab->name == NULL)
2910 break;
2911 core_optab = XNEW (templates);
2912 core_optab->start = optab;
2913 }
2914 }
2915 }
2916
2917 /* Initialize reg_hash hash table. */
2918 reg_hash = hash_new ();
2919 {
2920 const reg_entry *regtab;
2921 unsigned int regtab_size = i386_regtab_size;
2922
2923 for (regtab = i386_regtab; regtab_size--; regtab++)
2924 {
2925 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2926 if (hash_err)
2927 as_fatal (_("can't hash %s: %s"),
2928 regtab->reg_name,
2929 hash_err);
2930 }
2931 }
2932
2933 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
2934 {
2935 int c;
2936 char *p;
2937
2938 for (c = 0; c < 256; c++)
2939 {
2940 if (ISDIGIT (c))
2941 {
2942 digit_chars[c] = c;
2943 mnemonic_chars[c] = c;
2944 register_chars[c] = c;
2945 operand_chars[c] = c;
2946 }
2947 else if (ISLOWER (c))
2948 {
2949 mnemonic_chars[c] = c;
2950 register_chars[c] = c;
2951 operand_chars[c] = c;
2952 }
2953 else if (ISUPPER (c))
2954 {
2955 mnemonic_chars[c] = TOLOWER (c);
2956 register_chars[c] = mnemonic_chars[c];
2957 operand_chars[c] = c;
2958 }
2959 else if (c == '{' || c == '}')
2960 {
2961 mnemonic_chars[c] = c;
2962 operand_chars[c] = c;
2963 }
2964
2965 if (ISALPHA (c) || ISDIGIT (c))
2966 identifier_chars[c] = c;
2967 else if (c >= 128)
2968 {
2969 identifier_chars[c] = c;
2970 operand_chars[c] = c;
2971 }
2972 }
2973
2974 #ifdef LEX_AT
2975 identifier_chars['@'] = '@';
2976 #endif
2977 #ifdef LEX_QM
2978 identifier_chars['?'] = '?';
2979 operand_chars['?'] = '?';
2980 #endif
2981 digit_chars['-'] = '-';
2982 mnemonic_chars['_'] = '_';
2983 mnemonic_chars['-'] = '-';
2984 mnemonic_chars['.'] = '.';
2985 identifier_chars['_'] = '_';
2986 identifier_chars['.'] = '.';
2987
2988 for (p = operand_special_chars; *p != '\0'; p++)
2989 operand_chars[(unsigned char) *p] = *p;
2990 }
2991
2992 if (flag_code == CODE_64BIT)
2993 {
2994 #if defined (OBJ_COFF) && defined (TE_PE)
2995 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2996 ? 32 : 16);
2997 #else
2998 x86_dwarf2_return_column = 16;
2999 #endif
3000 x86_cie_data_alignment = -8;
3001 }
3002 else
3003 {
3004 x86_dwarf2_return_column = 8;
3005 x86_cie_data_alignment = -4;
3006 }
3007 }
3008
3009 void
3010 i386_print_statistics (FILE *file)
3011 {
3012 hash_print_statistics (file, "i386 opcode", op_hash);
3013 hash_print_statistics (file, "i386 register", reg_hash);
3014 }
3015 \f
3016 #ifdef DEBUG386
3017
3018 /* Debugging routines for md_assemble. */
3019 static void pte (insn_template *);
3020 static void pt (i386_operand_type);
3021 static void pe (expressionS *);
3022 static void ps (symbolS *);
3023
3024 static void
3025 pi (const char *line, i386_insn *x)
3026 {
3027 unsigned int j;
3028
3029 fprintf (stdout, "%s: template ", line);
3030 pte (&x->tm);
3031 fprintf (stdout, " address: base %s index %s scale %x\n",
3032 x->base_reg ? x->base_reg->reg_name : "none",
3033 x->index_reg ? x->index_reg->reg_name : "none",
3034 x->log2_scale_factor);
3035 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3036 x->rm.mode, x->rm.reg, x->rm.regmem);
3037 fprintf (stdout, " sib: base %x index %x scale %x\n",
3038 x->sib.base, x->sib.index, x->sib.scale);
3039 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3040 (x->rex & REX_W) != 0,
3041 (x->rex & REX_R) != 0,
3042 (x->rex & REX_X) != 0,
3043 (x->rex & REX_B) != 0);
3044 for (j = 0; j < x->operands; j++)
3045 {
3046 fprintf (stdout, " #%d: ", j + 1);
3047 pt (x->types[j]);
3048 fprintf (stdout, "\n");
3049 if (x->types[j].bitfield.class == Reg
3050 || x->types[j].bitfield.class == RegMMX
3051 || x->types[j].bitfield.class == RegSIMD
3052 || x->types[j].bitfield.class == SReg
3053 || x->types[j].bitfield.class == RegCR
3054 || x->types[j].bitfield.class == RegDR
3055 || x->types[j].bitfield.class == RegTR)
3056 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3057 if (operand_type_check (x->types[j], imm))
3058 pe (x->op[j].imms);
3059 if (operand_type_check (x->types[j], disp))
3060 pe (x->op[j].disps);
3061 }
3062 }
3063
3064 static void
3065 pte (insn_template *t)
3066 {
3067 unsigned int j;
3068 fprintf (stdout, " %d operands ", t->operands);
3069 fprintf (stdout, "opcode %x ", t->base_opcode);
3070 if (t->extension_opcode != None)
3071 fprintf (stdout, "ext %x ", t->extension_opcode);
3072 if (t->opcode_modifier.d)
3073 fprintf (stdout, "D");
3074 if (t->opcode_modifier.w)
3075 fprintf (stdout, "W");
3076 fprintf (stdout, "\n");
3077 for (j = 0; j < t->operands; j++)
3078 {
3079 fprintf (stdout, " #%d type ", j + 1);
3080 pt (t->operand_types[j]);
3081 fprintf (stdout, "\n");
3082 }
3083 }
3084
3085 static void
3086 pe (expressionS *e)
3087 {
3088 fprintf (stdout, " operation %d\n", e->X_op);
3089 fprintf (stdout, " add_number %ld (%lx)\n",
3090 (long) e->X_add_number, (long) e->X_add_number);
3091 if (e->X_add_symbol)
3092 {
3093 fprintf (stdout, " add_symbol ");
3094 ps (e->X_add_symbol);
3095 fprintf (stdout, "\n");
3096 }
3097 if (e->X_op_symbol)
3098 {
3099 fprintf (stdout, " op_symbol ");
3100 ps (e->X_op_symbol);
3101 fprintf (stdout, "\n");
3102 }
3103 }
3104
3105 static void
3106 ps (symbolS *s)
3107 {
3108 fprintf (stdout, "%s type %s%s",
3109 S_GET_NAME (s),
3110 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3111 segment_name (S_GET_SEGMENT (s)));
3112 }
3113
3114 static struct type_name
3115 {
3116 i386_operand_type mask;
3117 const char *name;
3118 }
3119 const type_names[] =
3120 {
3121 { OPERAND_TYPE_REG8, "r8" },
3122 { OPERAND_TYPE_REG16, "r16" },
3123 { OPERAND_TYPE_REG32, "r32" },
3124 { OPERAND_TYPE_REG64, "r64" },
3125 { OPERAND_TYPE_ACC8, "acc8" },
3126 { OPERAND_TYPE_ACC16, "acc16" },
3127 { OPERAND_TYPE_ACC32, "acc32" },
3128 { OPERAND_TYPE_ACC64, "acc64" },
3129 { OPERAND_TYPE_IMM8, "i8" },
3130 { OPERAND_TYPE_IMM8, "i8s" },
3131 { OPERAND_TYPE_IMM16, "i16" },
3132 { OPERAND_TYPE_IMM32, "i32" },
3133 { OPERAND_TYPE_IMM32S, "i32s" },
3134 { OPERAND_TYPE_IMM64, "i64" },
3135 { OPERAND_TYPE_IMM1, "i1" },
3136 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3137 { OPERAND_TYPE_DISP8, "d8" },
3138 { OPERAND_TYPE_DISP16, "d16" },
3139 { OPERAND_TYPE_DISP32, "d32" },
3140 { OPERAND_TYPE_DISP32S, "d32s" },
3141 { OPERAND_TYPE_DISP64, "d64" },
3142 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3143 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3144 { OPERAND_TYPE_CONTROL, "control reg" },
3145 { OPERAND_TYPE_TEST, "test reg" },
3146 { OPERAND_TYPE_DEBUG, "debug reg" },
3147 { OPERAND_TYPE_FLOATREG, "FReg" },
3148 { OPERAND_TYPE_FLOATACC, "FAcc" },
3149 { OPERAND_TYPE_SREG, "SReg" },
3150 { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
3151 { OPERAND_TYPE_REGMMX, "rMMX" },
3152 { OPERAND_TYPE_REGXMM, "rXMM" },
3153 { OPERAND_TYPE_REGYMM, "rYMM" },
3154 { OPERAND_TYPE_REGZMM, "rZMM" },
3155 { OPERAND_TYPE_REGMASK, "Mask reg" },
3156 { OPERAND_TYPE_ESSEG, "es" },
3157 };
3158
3159 static void
3160 pt (i386_operand_type t)
3161 {
3162 unsigned int j;
3163 i386_operand_type a;
3164
3165 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3166 {
3167 a = operand_type_and (t, type_names[j].mask);
3168 if (operand_type_equal (&a, &type_names[j].mask))
3169 fprintf (stdout, "%s, ", type_names[j].name);
3170 }
3171 fflush (stdout);
3172 }
3173
3174 #endif /* DEBUG386 */
3175 \f
3176 static bfd_reloc_code_real_type
3177 reloc (unsigned int size,
3178 int pcrel,
3179 int sign,
3180 bfd_reloc_code_real_type other)
3181 {
3182 if (other != NO_RELOC)
3183 {
3184 reloc_howto_type *rel;
3185
3186 if (size == 8)
3187 switch (other)
3188 {
3189 case BFD_RELOC_X86_64_GOT32:
3190 return BFD_RELOC_X86_64_GOT64;
3191 break;
3192 case BFD_RELOC_X86_64_GOTPLT64:
3193 return BFD_RELOC_X86_64_GOTPLT64;
3194 break;
3195 case BFD_RELOC_X86_64_PLTOFF64:
3196 return BFD_RELOC_X86_64_PLTOFF64;
3197 break;
3198 case BFD_RELOC_X86_64_GOTPC32:
3199 other = BFD_RELOC_X86_64_GOTPC64;
3200 break;
3201 case BFD_RELOC_X86_64_GOTPCREL:
3202 other = BFD_RELOC_X86_64_GOTPCREL64;
3203 break;
3204 case BFD_RELOC_X86_64_TPOFF32:
3205 other = BFD_RELOC_X86_64_TPOFF64;
3206 break;
3207 case BFD_RELOC_X86_64_DTPOFF32:
3208 other = BFD_RELOC_X86_64_DTPOFF64;
3209 break;
3210 default:
3211 break;
3212 }
3213
3214 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3215 if (other == BFD_RELOC_SIZE32)
3216 {
3217 if (size == 8)
3218 other = BFD_RELOC_SIZE64;
3219 if (pcrel)
3220 {
3221 as_bad (_("there are no pc-relative size relocations"));
3222 return NO_RELOC;
3223 }
3224 }
3225 #endif
3226
3227 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3228 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3229 sign = -1;
3230
3231 rel = bfd_reloc_type_lookup (stdoutput, other);
3232 if (!rel)
3233 as_bad (_("unknown relocation (%u)"), other);
3234 else if (size != bfd_get_reloc_size (rel))
3235 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3236 bfd_get_reloc_size (rel),
3237 size);
3238 else if (pcrel && !rel->pc_relative)
3239 as_bad (_("non-pc-relative relocation for pc-relative field"));
3240 else if ((rel->complain_on_overflow == complain_overflow_signed
3241 && !sign)
3242 || (rel->complain_on_overflow == complain_overflow_unsigned
3243 && sign > 0))
3244 as_bad (_("relocated field and relocation type differ in signedness"));
3245 else
3246 return other;
3247 return NO_RELOC;
3248 }
3249
3250 if (pcrel)
3251 {
3252 if (!sign)
3253 as_bad (_("there are no unsigned pc-relative relocations"));
3254 switch (size)
3255 {
3256 case 1: return BFD_RELOC_8_PCREL;
3257 case 2: return BFD_RELOC_16_PCREL;
3258 case 4: return BFD_RELOC_32_PCREL;
3259 case 8: return BFD_RELOC_64_PCREL;
3260 }
3261 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3262 }
3263 else
3264 {
3265 if (sign > 0)
3266 switch (size)
3267 {
3268 case 4: return BFD_RELOC_X86_64_32S;
3269 }
3270 else
3271 switch (size)
3272 {
3273 case 1: return BFD_RELOC_8;
3274 case 2: return BFD_RELOC_16;
3275 case 4: return BFD_RELOC_32;
3276 case 8: return BFD_RELOC_64;
3277 }
3278 as_bad (_("cannot do %s %u byte relocation"),
3279 sign > 0 ? "signed" : "unsigned", size);
3280 }
3281
3282 return NO_RELOC;
3283 }
3284
3285 /* Here we decide which fixups can be adjusted to make them relative to
3286 the beginning of the section instead of the symbol. Basically we need
3287 to make sure that the dynamic relocations are done correctly, so in
3288 some cases we force the original symbol to be used. */
3289
3290 int
3291 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3292 {
3293 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3294 if (!IS_ELF)
3295 return 1;
3296
3297 /* Don't adjust pc-relative references to merge sections in 64-bit
3298 mode. */
3299 if (use_rela_relocations
3300 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3301 && fixP->fx_pcrel)
3302 return 0;
3303
3304 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3305 and changed later by validate_fix. */
3306 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3307 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3308 return 0;
3309
3310 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3311 for size relocations. */
3312 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3313 || fixP->fx_r_type == BFD_RELOC_SIZE64
3314 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3315 || fixP->fx_r_type == BFD_RELOC_386_PLT32
3316 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3317 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3318 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3319 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3320 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3321 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3322 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3323 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3324 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3325 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3326 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3327 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3328 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3329 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3330 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3331 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3332 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3333 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3334 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3335 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3336 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3337 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3338 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3339 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3340 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3341 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3342 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3343 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3344 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3345 return 0;
3346 #endif
3347 return 1;
3348 }
3349
3350 static int
3351 intel_float_operand (const char *mnemonic)
3352 {
3353 /* Note that the value returned is meaningful only for opcodes with (memory)
3354 operands, hence the code here is free to improperly handle opcodes that
3355 have no operands (for better performance and smaller code). */
3356
3357 if (mnemonic[0] != 'f')
3358 return 0; /* non-math */
3359
3360 switch (mnemonic[1])
3361 {
3362 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3363 the fs segment override prefix not currently handled because no
3364 call path can make opcodes without operands get here */
3365 case 'i':
3366 return 2 /* integer op */;
3367 case 'l':
3368 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3369 return 3; /* fldcw/fldenv */
3370 break;
3371 case 'n':
3372 if (mnemonic[2] != 'o' /* fnop */)
3373 return 3; /* non-waiting control op */
3374 break;
3375 case 'r':
3376 if (mnemonic[2] == 's')
3377 return 3; /* frstor/frstpm */
3378 break;
3379 case 's':
3380 if (mnemonic[2] == 'a')
3381 return 3; /* fsave */
3382 if (mnemonic[2] == 't')
3383 {
3384 switch (mnemonic[3])
3385 {
3386 case 'c': /* fstcw */
3387 case 'd': /* fstdw */
3388 case 'e': /* fstenv */
3389 case 's': /* fsts[gw] */
3390 return 3;
3391 }
3392 }
3393 break;
3394 case 'x':
3395 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3396 return 0; /* fxsave/fxrstor are not really math ops */
3397 break;
3398 }
3399
3400 return 1;
3401 }
3402
3403 /* Build the VEX prefix. */
3404
3405 static void
3406 build_vex_prefix (const insn_template *t)
3407 {
3408 unsigned int register_specifier;
3409 unsigned int implied_prefix;
3410 unsigned int vector_length;
3411 unsigned int w;
3412
3413 /* Check register specifier. */
3414 if (i.vex.register_specifier)
3415 {
3416 register_specifier =
3417 ~register_number (i.vex.register_specifier) & 0xf;
3418 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3419 }
3420 else
3421 register_specifier = 0xf;
3422
3423 /* Use 2-byte VEX prefix by swapping destination and source operand
3424 if there are more than 1 register operand. */
3425 if (i.reg_operands > 1
3426 && i.vec_encoding != vex_encoding_vex3
3427 && i.dir_encoding == dir_encoding_default
3428 && i.operands == i.reg_operands
3429 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3430 && i.tm.opcode_modifier.vexopcode == VEX0F
3431 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3432 && i.rex == REX_B)
3433 {
3434 unsigned int xchg = i.operands - 1;
3435 union i386_op temp_op;
3436 i386_operand_type temp_type;
3437
3438 temp_type = i.types[xchg];
3439 i.types[xchg] = i.types[0];
3440 i.types[0] = temp_type;
3441 temp_op = i.op[xchg];
3442 i.op[xchg] = i.op[0];
3443 i.op[0] = temp_op;
3444
3445 gas_assert (i.rm.mode == 3);
3446
3447 i.rex = REX_R;
3448 xchg = i.rm.regmem;
3449 i.rm.regmem = i.rm.reg;
3450 i.rm.reg = xchg;
3451
3452 if (i.tm.opcode_modifier.d)
3453 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3454 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3455 else /* Use the next insn. */
3456 i.tm = t[1];
3457 }
3458
3459 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3460 are no memory operands and at least 3 register ones. */
3461 if (i.reg_operands >= 3
3462 && i.vec_encoding != vex_encoding_vex3
3463 && i.reg_operands == i.operands - i.imm_operands
3464 && i.tm.opcode_modifier.vex
3465 && i.tm.opcode_modifier.commutative
3466 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3467 && i.rex == REX_B
3468 && i.vex.register_specifier
3469 && !(i.vex.register_specifier->reg_flags & RegRex))
3470 {
3471 unsigned int xchg = i.operands - i.reg_operands;
3472 union i386_op temp_op;
3473 i386_operand_type temp_type;
3474
3475 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3476 gas_assert (!i.tm.opcode_modifier.sae);
3477 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3478 &i.types[i.operands - 3]));
3479 gas_assert (i.rm.mode == 3);
3480
3481 temp_type = i.types[xchg];
3482 i.types[xchg] = i.types[xchg + 1];
3483 i.types[xchg + 1] = temp_type;
3484 temp_op = i.op[xchg];
3485 i.op[xchg] = i.op[xchg + 1];
3486 i.op[xchg + 1] = temp_op;
3487
3488 i.rex = 0;
3489 xchg = i.rm.regmem | 8;
3490 i.rm.regmem = ~register_specifier & 0xf;
3491 gas_assert (!(i.rm.regmem & 8));
3492 i.vex.register_specifier += xchg - i.rm.regmem;
3493 register_specifier = ~xchg & 0xf;
3494 }
3495
3496 if (i.tm.opcode_modifier.vex == VEXScalar)
3497 vector_length = avxscalar;
3498 else if (i.tm.opcode_modifier.vex == VEX256)
3499 vector_length = 1;
3500 else
3501 {
3502 unsigned int op;
3503
3504 /* Determine vector length from the last multi-length vector
3505 operand. */
3506 vector_length = 0;
3507 for (op = t->operands; op--;)
3508 if (t->operand_types[op].bitfield.xmmword
3509 && t->operand_types[op].bitfield.ymmword
3510 && i.types[op].bitfield.ymmword)
3511 {
3512 vector_length = 1;
3513 break;
3514 }
3515 }
3516
3517 switch ((i.tm.base_opcode >> 8) & 0xff)
3518 {
3519 case 0:
3520 implied_prefix = 0;
3521 break;
3522 case DATA_PREFIX_OPCODE:
3523 implied_prefix = 1;
3524 break;
3525 case REPE_PREFIX_OPCODE:
3526 implied_prefix = 2;
3527 break;
3528 case REPNE_PREFIX_OPCODE:
3529 implied_prefix = 3;
3530 break;
3531 default:
3532 abort ();
3533 }
3534
3535 /* Check the REX.W bit and VEXW. */
3536 if (i.tm.opcode_modifier.vexw == VEXWIG)
3537 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3538 else if (i.tm.opcode_modifier.vexw)
3539 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3540 else
3541 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3542
3543 /* Use 2-byte VEX prefix if possible. */
3544 if (w == 0
3545 && i.vec_encoding != vex_encoding_vex3
3546 && i.tm.opcode_modifier.vexopcode == VEX0F
3547 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3548 {
3549 /* 2-byte VEX prefix. */
3550 unsigned int r;
3551
3552 i.vex.length = 2;
3553 i.vex.bytes[0] = 0xc5;
3554
3555 /* Check the REX.R bit. */
3556 r = (i.rex & REX_R) ? 0 : 1;
3557 i.vex.bytes[1] = (r << 7
3558 | register_specifier << 3
3559 | vector_length << 2
3560 | implied_prefix);
3561 }
3562 else
3563 {
3564 /* 3-byte VEX prefix. */
3565 unsigned int m;
3566
3567 i.vex.length = 3;
3568
3569 switch (i.tm.opcode_modifier.vexopcode)
3570 {
3571 case VEX0F:
3572 m = 0x1;
3573 i.vex.bytes[0] = 0xc4;
3574 break;
3575 case VEX0F38:
3576 m = 0x2;
3577 i.vex.bytes[0] = 0xc4;
3578 break;
3579 case VEX0F3A:
3580 m = 0x3;
3581 i.vex.bytes[0] = 0xc4;
3582 break;
3583 case XOP08:
3584 m = 0x8;
3585 i.vex.bytes[0] = 0x8f;
3586 break;
3587 case XOP09:
3588 m = 0x9;
3589 i.vex.bytes[0] = 0x8f;
3590 break;
3591 case XOP0A:
3592 m = 0xa;
3593 i.vex.bytes[0] = 0x8f;
3594 break;
3595 default:
3596 abort ();
3597 }
3598
3599 /* The high 3 bits of the second VEX byte are 1's compliment
3600 of RXB bits from REX. */
3601 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3602
3603 i.vex.bytes[2] = (w << 7
3604 | register_specifier << 3
3605 | vector_length << 2
3606 | implied_prefix);
3607 }
3608 }
3609
3610 static INLINE bfd_boolean
3611 is_evex_encoding (const insn_template *t)
3612 {
3613 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3614 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3615 || t->opcode_modifier.sae;
3616 }
3617
3618 static INLINE bfd_boolean
3619 is_any_vex_encoding (const insn_template *t)
3620 {
3621 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3622 || is_evex_encoding (t);
3623 }
3624
3625 /* Build the EVEX prefix. */
3626
3627 static void
3628 build_evex_prefix (void)
3629 {
3630 unsigned int register_specifier;
3631 unsigned int implied_prefix;
3632 unsigned int m, w;
3633 rex_byte vrex_used = 0;
3634
3635 /* Check register specifier. */
3636 if (i.vex.register_specifier)
3637 {
3638 gas_assert ((i.vrex & REX_X) == 0);
3639
3640 register_specifier = i.vex.register_specifier->reg_num;
3641 if ((i.vex.register_specifier->reg_flags & RegRex))
3642 register_specifier += 8;
3643 /* The upper 16 registers are encoded in the fourth byte of the
3644 EVEX prefix. */
3645 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3646 i.vex.bytes[3] = 0x8;
3647 register_specifier = ~register_specifier & 0xf;
3648 }
3649 else
3650 {
3651 register_specifier = 0xf;
3652
3653 /* Encode upper 16 vector index register in the fourth byte of
3654 the EVEX prefix. */
3655 if (!(i.vrex & REX_X))
3656 i.vex.bytes[3] = 0x8;
3657 else
3658 vrex_used |= REX_X;
3659 }
3660
3661 switch ((i.tm.base_opcode >> 8) & 0xff)
3662 {
3663 case 0:
3664 implied_prefix = 0;
3665 break;
3666 case DATA_PREFIX_OPCODE:
3667 implied_prefix = 1;
3668 break;
3669 case REPE_PREFIX_OPCODE:
3670 implied_prefix = 2;
3671 break;
3672 case REPNE_PREFIX_OPCODE:
3673 implied_prefix = 3;
3674 break;
3675 default:
3676 abort ();
3677 }
3678
3679 /* 4 byte EVEX prefix. */
3680 i.vex.length = 4;
3681 i.vex.bytes[0] = 0x62;
3682
3683 /* mmmm bits. */
3684 switch (i.tm.opcode_modifier.vexopcode)
3685 {
3686 case VEX0F:
3687 m = 1;
3688 break;
3689 case VEX0F38:
3690 m = 2;
3691 break;
3692 case VEX0F3A:
3693 m = 3;
3694 break;
3695 default:
3696 abort ();
3697 break;
3698 }
3699
3700 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3701 bits from REX. */
3702 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3703
3704 /* The fifth bit of the second EVEX byte is 1's compliment of the
3705 REX_R bit in VREX. */
3706 if (!(i.vrex & REX_R))
3707 i.vex.bytes[1] |= 0x10;
3708 else
3709 vrex_used |= REX_R;
3710
3711 if ((i.reg_operands + i.imm_operands) == i.operands)
3712 {
3713 /* When all operands are registers, the REX_X bit in REX is not
3714 used. We reuse it to encode the upper 16 registers, which is
3715 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3716 as 1's compliment. */
3717 if ((i.vrex & REX_B))
3718 {
3719 vrex_used |= REX_B;
3720 i.vex.bytes[1] &= ~0x40;
3721 }
3722 }
3723
3724 /* EVEX instructions shouldn't need the REX prefix. */
3725 i.vrex &= ~vrex_used;
3726 gas_assert (i.vrex == 0);
3727
3728 /* Check the REX.W bit and VEXW. */
3729 if (i.tm.opcode_modifier.vexw == VEXWIG)
3730 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3731 else if (i.tm.opcode_modifier.vexw)
3732 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3733 else
3734 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3735
3736 /* Encode the U bit. */
3737 implied_prefix |= 0x4;
3738
3739 /* The third byte of the EVEX prefix. */
3740 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3741
3742 /* The fourth byte of the EVEX prefix. */
3743 /* The zeroing-masking bit. */
3744 if (i.mask && i.mask->zeroing)
3745 i.vex.bytes[3] |= 0x80;
3746
3747 /* Don't always set the broadcast bit if there is no RC. */
3748 if (!i.rounding)
3749 {
3750 /* Encode the vector length. */
3751 unsigned int vec_length;
3752
3753 if (!i.tm.opcode_modifier.evex
3754 || i.tm.opcode_modifier.evex == EVEXDYN)
3755 {
3756 unsigned int op;
3757
3758 /* Determine vector length from the last multi-length vector
3759 operand. */
3760 vec_length = 0;
3761 for (op = i.operands; op--;)
3762 if (i.tm.operand_types[op].bitfield.xmmword
3763 + i.tm.operand_types[op].bitfield.ymmword
3764 + i.tm.operand_types[op].bitfield.zmmword > 1)
3765 {
3766 if (i.types[op].bitfield.zmmword)
3767 {
3768 i.tm.opcode_modifier.evex = EVEX512;
3769 break;
3770 }
3771 else if (i.types[op].bitfield.ymmword)
3772 {
3773 i.tm.opcode_modifier.evex = EVEX256;
3774 break;
3775 }
3776 else if (i.types[op].bitfield.xmmword)
3777 {
3778 i.tm.opcode_modifier.evex = EVEX128;
3779 break;
3780 }
3781 else if (i.broadcast && (int) op == i.broadcast->operand)
3782 {
3783 switch (i.broadcast->bytes)
3784 {
3785 case 64:
3786 i.tm.opcode_modifier.evex = EVEX512;
3787 break;
3788 case 32:
3789 i.tm.opcode_modifier.evex = EVEX256;
3790 break;
3791 case 16:
3792 i.tm.opcode_modifier.evex = EVEX128;
3793 break;
3794 default:
3795 abort ();
3796 }
3797 break;
3798 }
3799 }
3800
3801 if (op >= MAX_OPERANDS)
3802 abort ();
3803 }
3804
3805 switch (i.tm.opcode_modifier.evex)
3806 {
3807 case EVEXLIG: /* LL' is ignored */
3808 vec_length = evexlig << 5;
3809 break;
3810 case EVEX128:
3811 vec_length = 0 << 5;
3812 break;
3813 case EVEX256:
3814 vec_length = 1 << 5;
3815 break;
3816 case EVEX512:
3817 vec_length = 2 << 5;
3818 break;
3819 default:
3820 abort ();
3821 break;
3822 }
3823 i.vex.bytes[3] |= vec_length;
3824 /* Encode the broadcast bit. */
3825 if (i.broadcast)
3826 i.vex.bytes[3] |= 0x10;
3827 }
3828 else
3829 {
3830 if (i.rounding->type != saeonly)
3831 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3832 else
3833 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3834 }
3835
3836 if (i.mask && i.mask->mask)
3837 i.vex.bytes[3] |= i.mask->mask->reg_num;
3838 }
3839
3840 static void
3841 process_immext (void)
3842 {
3843 expressionS *exp;
3844
3845 if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3846 && i.operands > 0)
3847 {
3848 /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3849 with an opcode suffix which is coded in the same place as an
3850 8-bit immediate field would be.
3851 Here we check those operands and remove them afterwards. */
3852 unsigned int x;
3853
3854 for (x = 0; x < i.operands; x++)
3855 if (register_number (i.op[x].regs) != x)
3856 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3857 register_prefix, i.op[x].regs->reg_name, x + 1,
3858 i.tm.name);
3859
3860 i.operands = 0;
3861 }
3862
3863 if (i.tm.cpu_flags.bitfield.cpumwaitx && i.operands > 0)
3864 {
3865 /* MONITORX/MWAITX instructions have fixed operands with an opcode
3866 suffix which is coded in the same place as an 8-bit immediate
3867 field would be.
3868 Here we check those operands and remove them afterwards. */
3869 unsigned int x;
3870
3871 if (i.operands != 3)
3872 abort();
3873
3874 for (x = 0; x < 2; x++)
3875 if (register_number (i.op[x].regs) != x)
3876 goto bad_register_operand;
3877
3878 /* Check for third operand for mwaitx/monitorx insn. */
3879 if (register_number (i.op[x].regs)
3880 != (x + (i.tm.extension_opcode == 0xfb)))
3881 {
3882 bad_register_operand:
3883 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3884 register_prefix, i.op[x].regs->reg_name, x+1,
3885 i.tm.name);
3886 }
3887
3888 i.operands = 0;
3889 }
3890
3891 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3892 which is coded in the same place as an 8-bit immediate field
3893 would be. Here we fake an 8-bit immediate operand from the
3894 opcode suffix stored in tm.extension_opcode.
3895
3896 AVX instructions also use this encoding, for some of
3897 3 argument instructions. */
3898
3899 gas_assert (i.imm_operands <= 1
3900 && (i.operands <= 2
3901 || (is_any_vex_encoding (&i.tm)
3902 && i.operands <= 4)));
3903
3904 exp = &im_expressions[i.imm_operands++];
3905 i.op[i.operands].imms = exp;
3906 i.types[i.operands] = imm8;
3907 i.operands++;
3908 exp->X_op = O_constant;
3909 exp->X_add_number = i.tm.extension_opcode;
3910 i.tm.extension_opcode = None;
3911 }
3912
3913
3914 static int
3915 check_hle (void)
3916 {
3917 switch (i.tm.opcode_modifier.hleprefixok)
3918 {
3919 default:
3920 abort ();
3921 case HLEPrefixNone:
3922 as_bad (_("invalid instruction `%s' after `%s'"),
3923 i.tm.name, i.hle_prefix);
3924 return 0;
3925 case HLEPrefixLock:
3926 if (i.prefix[LOCK_PREFIX])
3927 return 1;
3928 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3929 return 0;
3930 case HLEPrefixAny:
3931 return 1;
3932 case HLEPrefixRelease:
3933 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3934 {
3935 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3936 i.tm.name);
3937 return 0;
3938 }
3939 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
3940 {
3941 as_bad (_("memory destination needed for instruction `%s'"
3942 " after `xrelease'"), i.tm.name);
3943 return 0;
3944 }
3945 return 1;
3946 }
3947 }
3948
3949 /* Try the shortest encoding by shortening operand size. */
3950
3951 static void
3952 optimize_encoding (void)
3953 {
3954 unsigned int j;
3955
3956 if (optimize_for_space
3957 && i.reg_operands == 1
3958 && i.imm_operands == 1
3959 && !i.types[1].bitfield.byte
3960 && i.op[0].imms->X_op == O_constant
3961 && fits_in_imm7 (i.op[0].imms->X_add_number)
3962 && ((i.tm.base_opcode == 0xa8
3963 && i.tm.extension_opcode == None)
3964 || (i.tm.base_opcode == 0xf6
3965 && i.tm.extension_opcode == 0x0)))
3966 {
3967 /* Optimize: -Os:
3968 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
3969 */
3970 unsigned int base_regnum = i.op[1].regs->reg_num;
3971 if (flag_code == CODE_64BIT || base_regnum < 4)
3972 {
3973 i.types[1].bitfield.byte = 1;
3974 /* Ignore the suffix. */
3975 i.suffix = 0;
3976 if (base_regnum >= 4
3977 && !(i.op[1].regs->reg_flags & RegRex))
3978 {
3979 /* Handle SP, BP, SI and DI registers. */
3980 if (i.types[1].bitfield.word)
3981 j = 16;
3982 else if (i.types[1].bitfield.dword)
3983 j = 32;
3984 else
3985 j = 48;
3986 i.op[1].regs -= j;
3987 }
3988 }
3989 }
3990 else if (flag_code == CODE_64BIT
3991 && ((i.types[1].bitfield.qword
3992 && i.reg_operands == 1
3993 && i.imm_operands == 1
3994 && i.op[0].imms->X_op == O_constant
3995 && ((i.tm.base_opcode == 0xb8
3996 && i.tm.extension_opcode == None
3997 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
3998 || (fits_in_imm31 (i.op[0].imms->X_add_number)
3999 && (((i.tm.base_opcode == 0x24
4000 || i.tm.base_opcode == 0xa8)
4001 && i.tm.extension_opcode == None)
4002 || (i.tm.base_opcode == 0x80
4003 && i.tm.extension_opcode == 0x4)
4004 || ((i.tm.base_opcode == 0xf6
4005 || (i.tm.base_opcode | 1) == 0xc7)
4006 && i.tm.extension_opcode == 0x0)))
4007 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4008 && i.tm.base_opcode == 0x83
4009 && i.tm.extension_opcode == 0x4)))
4010 || (i.types[0].bitfield.qword
4011 && ((i.reg_operands == 2
4012 && i.op[0].regs == i.op[1].regs
4013 && ((i.tm.base_opcode == 0x30
4014 || i.tm.base_opcode == 0x28)
4015 && i.tm.extension_opcode == None))
4016 || (i.reg_operands == 1
4017 && i.operands == 1
4018 && i.tm.base_opcode == 0x30
4019 && i.tm.extension_opcode == None)))))
4020 {
4021 /* Optimize: -O:
4022 andq $imm31, %r64 -> andl $imm31, %r32
4023 andq $imm7, %r64 -> andl $imm7, %r32
4024 testq $imm31, %r64 -> testl $imm31, %r32
4025 xorq %r64, %r64 -> xorl %r32, %r32
4026 subq %r64, %r64 -> subl %r32, %r32
4027 movq $imm31, %r64 -> movl $imm31, %r32
4028 movq $imm32, %r64 -> movl $imm32, %r32
4029 */
4030 i.tm.opcode_modifier.norex64 = 1;
4031 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4032 {
4033 /* Handle
4034 movq $imm31, %r64 -> movl $imm31, %r32
4035 movq $imm32, %r64 -> movl $imm32, %r32
4036 */
4037 i.tm.operand_types[0].bitfield.imm32 = 1;
4038 i.tm.operand_types[0].bitfield.imm32s = 0;
4039 i.tm.operand_types[0].bitfield.imm64 = 0;
4040 i.types[0].bitfield.imm32 = 1;
4041 i.types[0].bitfield.imm32s = 0;
4042 i.types[0].bitfield.imm64 = 0;
4043 i.types[1].bitfield.dword = 1;
4044 i.types[1].bitfield.qword = 0;
4045 if ((i.tm.base_opcode | 1) == 0xc7)
4046 {
4047 /* Handle
4048 movq $imm31, %r64 -> movl $imm31, %r32
4049 */
4050 i.tm.base_opcode = 0xb8;
4051 i.tm.extension_opcode = None;
4052 i.tm.opcode_modifier.w = 0;
4053 i.tm.opcode_modifier.shortform = 1;
4054 i.tm.opcode_modifier.modrm = 0;
4055 }
4056 }
4057 }
4058 else if (optimize > 1
4059 && !optimize_for_space
4060 && i.reg_operands == 2
4061 && i.op[0].regs == i.op[1].regs
4062 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4063 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4064 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4065 {
4066 /* Optimize: -O2:
4067 andb %rN, %rN -> testb %rN, %rN
4068 andw %rN, %rN -> testw %rN, %rN
4069 andq %rN, %rN -> testq %rN, %rN
4070 orb %rN, %rN -> testb %rN, %rN
4071 orw %rN, %rN -> testw %rN, %rN
4072 orq %rN, %rN -> testq %rN, %rN
4073
4074 and outside of 64-bit mode
4075
4076 andl %rN, %rN -> testl %rN, %rN
4077 orl %rN, %rN -> testl %rN, %rN
4078 */
4079 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4080 }
4081 else if (i.reg_operands == 3
4082 && i.op[0].regs == i.op[1].regs
4083 && !i.types[2].bitfield.xmmword
4084 && (i.tm.opcode_modifier.vex
4085 || ((!i.mask || i.mask->zeroing)
4086 && !i.rounding
4087 && is_evex_encoding (&i.tm)
4088 && (i.vec_encoding != vex_encoding_evex
4089 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4090 || i.tm.cpu_flags.bitfield.cpuavx512vl
4091 || (i.tm.operand_types[2].bitfield.zmmword
4092 && i.types[2].bitfield.ymmword))))
4093 && ((i.tm.base_opcode == 0x55
4094 || i.tm.base_opcode == 0x6655
4095 || i.tm.base_opcode == 0x66df
4096 || i.tm.base_opcode == 0x57
4097 || i.tm.base_opcode == 0x6657
4098 || i.tm.base_opcode == 0x66ef
4099 || i.tm.base_opcode == 0x66f8
4100 || i.tm.base_opcode == 0x66f9
4101 || i.tm.base_opcode == 0x66fa
4102 || i.tm.base_opcode == 0x66fb
4103 || i.tm.base_opcode == 0x42
4104 || i.tm.base_opcode == 0x6642
4105 || i.tm.base_opcode == 0x47
4106 || i.tm.base_opcode == 0x6647)
4107 && i.tm.extension_opcode == None))
4108 {
4109 /* Optimize: -O1:
4110 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4111 vpsubq and vpsubw:
4112 EVEX VOP %zmmM, %zmmM, %zmmN
4113 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4114 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4115 EVEX VOP %ymmM, %ymmM, %ymmN
4116 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4117 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4118 VEX VOP %ymmM, %ymmM, %ymmN
4119 -> VEX VOP %xmmM, %xmmM, %xmmN
4120 VOP, one of vpandn and vpxor:
4121 VEX VOP %ymmM, %ymmM, %ymmN
4122 -> VEX VOP %xmmM, %xmmM, %xmmN
4123 VOP, one of vpandnd and vpandnq:
4124 EVEX VOP %zmmM, %zmmM, %zmmN
4125 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4126 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4127 EVEX VOP %ymmM, %ymmM, %ymmN
4128 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4129 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4130 VOP, one of vpxord and vpxorq:
4131 EVEX VOP %zmmM, %zmmM, %zmmN
4132 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4133 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4134 EVEX VOP %ymmM, %ymmM, %ymmN
4135 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4136 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4137 VOP, one of kxord and kxorq:
4138 VEX VOP %kM, %kM, %kN
4139 -> VEX kxorw %kM, %kM, %kN
4140 VOP, one of kandnd and kandnq:
4141 VEX VOP %kM, %kM, %kN
4142 -> VEX kandnw %kM, %kM, %kN
4143 */
4144 if (is_evex_encoding (&i.tm))
4145 {
4146 if (i.vec_encoding != vex_encoding_evex)
4147 {
4148 i.tm.opcode_modifier.vex = VEX128;
4149 i.tm.opcode_modifier.vexw = VEXW0;
4150 i.tm.opcode_modifier.evex = 0;
4151 }
4152 else if (optimize > 1)
4153 i.tm.opcode_modifier.evex = EVEX128;
4154 else
4155 return;
4156 }
4157 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4158 {
4159 i.tm.base_opcode &= 0xff;
4160 i.tm.opcode_modifier.vexw = VEXW0;
4161 }
4162 else
4163 i.tm.opcode_modifier.vex = VEX128;
4164
4165 if (i.tm.opcode_modifier.vex)
4166 for (j = 0; j < 3; j++)
4167 {
4168 i.types[j].bitfield.xmmword = 1;
4169 i.types[j].bitfield.ymmword = 0;
4170 }
4171 }
4172 else if (i.vec_encoding != vex_encoding_evex
4173 && !i.types[0].bitfield.zmmword
4174 && !i.types[1].bitfield.zmmword
4175 && !i.mask
4176 && !i.broadcast
4177 && is_evex_encoding (&i.tm)
4178 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4179 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4180 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4181 || (i.tm.base_opcode & ~4) == 0x66db
4182 || (i.tm.base_opcode & ~4) == 0x66eb)
4183 && i.tm.extension_opcode == None)
4184 {
4185 /* Optimize: -O1:
4186 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4187 vmovdqu32 and vmovdqu64:
4188 EVEX VOP %xmmM, %xmmN
4189 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4190 EVEX VOP %ymmM, %ymmN
4191 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4192 EVEX VOP %xmmM, mem
4193 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4194 EVEX VOP %ymmM, mem
4195 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4196 EVEX VOP mem, %xmmN
4197 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4198 EVEX VOP mem, %ymmN
4199 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4200 VOP, one of vpand, vpandn, vpor, vpxor:
4201 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4202 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4203 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4204 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4205 EVEX VOP{d,q} mem, %xmmM, %xmmN
4206 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4207 EVEX VOP{d,q} mem, %ymmM, %ymmN
4208 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4209 */
4210 for (j = 0; j < i.operands; j++)
4211 if (operand_type_check (i.types[j], disp)
4212 && i.op[j].disps->X_op == O_constant)
4213 {
4214 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4215 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4216 bytes, we choose EVEX Disp8 over VEX Disp32. */
4217 int evex_disp8, vex_disp8;
4218 unsigned int memshift = i.memshift;
4219 offsetT n = i.op[j].disps->X_add_number;
4220
4221 evex_disp8 = fits_in_disp8 (n);
4222 i.memshift = 0;
4223 vex_disp8 = fits_in_disp8 (n);
4224 if (evex_disp8 != vex_disp8)
4225 {
4226 i.memshift = memshift;
4227 return;
4228 }
4229
4230 i.types[j].bitfield.disp8 = vex_disp8;
4231 break;
4232 }
4233 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4234 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4235 i.tm.opcode_modifier.vex
4236 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4237 i.tm.opcode_modifier.vexw = VEXW0;
4238 /* VPAND, VPOR, and VPXOR are commutative. */
4239 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4240 i.tm.opcode_modifier.commutative = 1;
4241 i.tm.opcode_modifier.evex = 0;
4242 i.tm.opcode_modifier.masking = 0;
4243 i.tm.opcode_modifier.broadcast = 0;
4244 i.tm.opcode_modifier.disp8memshift = 0;
4245 i.memshift = 0;
4246 if (j < i.operands)
4247 i.types[j].bitfield.disp8
4248 = fits_in_disp8 (i.op[j].disps->X_add_number);
4249 }
4250 }
4251
4252 /* This is the guts of the machine-dependent assembler. LINE points to a
4253 machine dependent instruction. This function is supposed to emit
4254 the frags/bytes it assembles to. */
4255
4256 void
4257 md_assemble (char *line)
4258 {
4259 unsigned int j;
4260 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4261 const insn_template *t;
4262
4263 /* Initialize globals. */
4264 memset (&i, '\0', sizeof (i));
4265 for (j = 0; j < MAX_OPERANDS; j++)
4266 i.reloc[j] = NO_RELOC;
4267 memset (disp_expressions, '\0', sizeof (disp_expressions));
4268 memset (im_expressions, '\0', sizeof (im_expressions));
4269 save_stack_p = save_stack;
4270
4271 /* First parse an instruction mnemonic & call i386_operand for the operands.
4272 We assume that the scrubber has arranged it so that line[0] is the valid
4273 start of a (possibly prefixed) mnemonic. */
4274
4275 line = parse_insn (line, mnemonic);
4276 if (line == NULL)
4277 return;
4278 mnem_suffix = i.suffix;
4279
4280 line = parse_operands (line, mnemonic);
4281 this_operand = -1;
4282 xfree (i.memop1_string);
4283 i.memop1_string = NULL;
4284 if (line == NULL)
4285 return;
4286
4287 /* Now we've parsed the mnemonic into a set of templates, and have the
4288 operands at hand. */
4289
4290 /* All intel opcodes have reversed operands except for "bound" and
4291 "enter". We also don't reverse intersegment "jmp" and "call"
4292 instructions with 2 immediate operands so that the immediate segment
4293 precedes the offset, as it does when in AT&T mode. */
4294 if (intel_syntax
4295 && i.operands > 1
4296 && (strcmp (mnemonic, "bound") != 0)
4297 && (strcmp (mnemonic, "invlpga") != 0)
4298 && !(operand_type_check (i.types[0], imm)
4299 && operand_type_check (i.types[1], imm)))
4300 swap_operands ();
4301
4302 /* The order of the immediates should be reversed
4303 for 2 immediates extrq and insertq instructions */
4304 if (i.imm_operands == 2
4305 && (strcmp (mnemonic, "extrq") == 0
4306 || strcmp (mnemonic, "insertq") == 0))
4307 swap_2_operands (0, 1);
4308
4309 if (i.imm_operands)
4310 optimize_imm ();
4311
4312 /* Don't optimize displacement for movabs since it only takes 64bit
4313 displacement. */
4314 if (i.disp_operands
4315 && i.disp_encoding != disp_encoding_32bit
4316 && (flag_code != CODE_64BIT
4317 || strcmp (mnemonic, "movabs") != 0))
4318 optimize_disp ();
4319
4320 /* Next, we find a template that matches the given insn,
4321 making sure the overlap of the given operands types is consistent
4322 with the template operand types. */
4323
4324 if (!(t = match_template (mnem_suffix)))
4325 return;
4326
4327 if (sse_check != check_none
4328 && !i.tm.opcode_modifier.noavx
4329 && !i.tm.cpu_flags.bitfield.cpuavx
4330 && (i.tm.cpu_flags.bitfield.cpusse
4331 || i.tm.cpu_flags.bitfield.cpusse2
4332 || i.tm.cpu_flags.bitfield.cpusse3
4333 || i.tm.cpu_flags.bitfield.cpussse3
4334 || i.tm.cpu_flags.bitfield.cpusse4_1
4335 || i.tm.cpu_flags.bitfield.cpusse4_2
4336 || i.tm.cpu_flags.bitfield.cpupclmul
4337 || i.tm.cpu_flags.bitfield.cpuaes
4338 || i.tm.cpu_flags.bitfield.cpugfni))
4339 {
4340 (sse_check == check_warning
4341 ? as_warn
4342 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4343 }
4344
4345 /* Zap movzx and movsx suffix. The suffix has been set from
4346 "word ptr" or "byte ptr" on the source operand in Intel syntax
4347 or extracted from mnemonic in AT&T syntax. But we'll use
4348 the destination register to choose the suffix for encoding. */
4349 if ((i.tm.base_opcode & ~9) == 0x0fb6)
4350 {
4351 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
4352 there is no suffix, the default will be byte extension. */
4353 if (i.reg_operands != 2
4354 && !i.suffix
4355 && intel_syntax)
4356 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4357
4358 i.suffix = 0;
4359 }
4360
4361 if (i.tm.opcode_modifier.fwait)
4362 if (!add_prefix (FWAIT_OPCODE))
4363 return;
4364
4365 /* Check if REP prefix is OK. */
4366 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4367 {
4368 as_bad (_("invalid instruction `%s' after `%s'"),
4369 i.tm.name, i.rep_prefix);
4370 return;
4371 }
4372
4373 /* Check for lock without a lockable instruction. Destination operand
4374 must be memory unless it is xchg (0x86). */
4375 if (i.prefix[LOCK_PREFIX]
4376 && (!i.tm.opcode_modifier.islockable
4377 || i.mem_operands == 0
4378 || (i.tm.base_opcode != 0x86
4379 && !(i.flags[i.operands - 1] & Operand_Mem))))
4380 {
4381 as_bad (_("expecting lockable instruction after `lock'"));
4382 return;
4383 }
4384
4385 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4386 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4387 {
4388 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4389 return;
4390 }
4391
4392 /* Check if HLE prefix is OK. */
4393 if (i.hle_prefix && !check_hle ())
4394 return;
4395
4396 /* Check BND prefix. */
4397 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4398 as_bad (_("expecting valid branch instruction after `bnd'"));
4399
4400 /* Check NOTRACK prefix. */
4401 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4402 as_bad (_("expecting indirect branch instruction after `notrack'"));
4403
4404 if (i.tm.cpu_flags.bitfield.cpumpx)
4405 {
4406 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4407 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4408 else if (flag_code != CODE_16BIT
4409 ? i.prefix[ADDR_PREFIX]
4410 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4411 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4412 }
4413
4414 /* Insert BND prefix. */
4415 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4416 {
4417 if (!i.prefix[BND_PREFIX])
4418 add_prefix (BND_PREFIX_OPCODE);
4419 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4420 {
4421 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4422 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4423 }
4424 }
4425
4426 /* Check string instruction segment overrides. */
4427 if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
4428 {
4429 if (!check_string ())
4430 return;
4431 i.disp_operands = 0;
4432 }
4433
4434 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4435 optimize_encoding ();
4436
4437 if (!process_suffix ())
4438 return;
4439
4440 /* Update operand types. */
4441 for (j = 0; j < i.operands; j++)
4442 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4443
4444 /* Make still unresolved immediate matches conform to size of immediate
4445 given in i.suffix. */
4446 if (!finalize_imm ())
4447 return;
4448
4449 if (i.types[0].bitfield.imm1)
4450 i.imm_operands = 0; /* kludge for shift insns. */
4451
4452 /* We only need to check those implicit registers for instructions
4453 with 3 operands or less. */
4454 if (i.operands <= 3)
4455 for (j = 0; j < i.operands; j++)
4456 if (i.types[j].bitfield.inoutportreg
4457 || i.types[j].bitfield.shiftcount
4458 || (i.types[j].bitfield.acc && !i.types[j].bitfield.xmmword))
4459 i.reg_operands--;
4460
4461 /* ImmExt should be processed after SSE2AVX. */
4462 if (!i.tm.opcode_modifier.sse2avx
4463 && i.tm.opcode_modifier.immext)
4464 process_immext ();
4465
4466 /* For insns with operands there are more diddles to do to the opcode. */
4467 if (i.operands)
4468 {
4469 if (!process_operands ())
4470 return;
4471 }
4472 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4473 {
4474 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4475 as_warn (_("translating to `%sp'"), i.tm.name);
4476 }
4477
4478 if (is_any_vex_encoding (&i.tm))
4479 {
4480 if (!cpu_arch_flags.bitfield.cpui286)
4481 {
4482 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4483 i.tm.name);
4484 return;
4485 }
4486
4487 if (i.tm.opcode_modifier.vex)
4488 build_vex_prefix (t);
4489 else
4490 build_evex_prefix ();
4491 }
4492
4493 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4494 instructions may define INT_OPCODE as well, so avoid this corner
4495 case for those instructions that use MODRM. */
4496 if (i.tm.base_opcode == INT_OPCODE
4497 && !i.tm.opcode_modifier.modrm
4498 && i.op[0].imms->X_add_number == 3)
4499 {
4500 i.tm.base_opcode = INT3_OPCODE;
4501 i.imm_operands = 0;
4502 }
4503
4504 if ((i.tm.opcode_modifier.jump
4505 || i.tm.opcode_modifier.jumpbyte
4506 || i.tm.opcode_modifier.jumpdword)
4507 && i.op[0].disps->X_op == O_constant)
4508 {
4509 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4510 the absolute address given by the constant. Since ix86 jumps and
4511 calls are pc relative, we need to generate a reloc. */
4512 i.op[0].disps->X_add_symbol = &abs_symbol;
4513 i.op[0].disps->X_op = O_symbol;
4514 }
4515
4516 if (i.tm.opcode_modifier.rex64)
4517 i.rex |= REX_W;
4518
4519 /* For 8 bit registers we need an empty rex prefix. Also if the
4520 instruction already has a prefix, we need to convert old
4521 registers to new ones. */
4522
4523 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4524 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4525 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4526 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4527 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4528 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4529 && i.rex != 0))
4530 {
4531 int x;
4532
4533 i.rex |= REX_OPCODE;
4534 for (x = 0; x < 2; x++)
4535 {
4536 /* Look for 8 bit operand that uses old registers. */
4537 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4538 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4539 {
4540 /* In case it is "hi" register, give up. */
4541 if (i.op[x].regs->reg_num > 3)
4542 as_bad (_("can't encode register '%s%s' in an "
4543 "instruction requiring REX prefix."),
4544 register_prefix, i.op[x].regs->reg_name);
4545
4546 /* Otherwise it is equivalent to the extended register.
4547 Since the encoding doesn't change this is merely
4548 cosmetic cleanup for debug output. */
4549
4550 i.op[x].regs = i.op[x].regs + 8;
4551 }
4552 }
4553 }
4554
4555 if (i.rex == 0 && i.rex_encoding)
4556 {
4557 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4558 that uses legacy register. If it is "hi" register, don't add
4559 the REX_OPCODE byte. */
4560 int x;
4561 for (x = 0; x < 2; x++)
4562 if (i.types[x].bitfield.class == Reg
4563 && i.types[x].bitfield.byte
4564 && (i.op[x].regs->reg_flags & RegRex64) == 0
4565 && i.op[x].regs->reg_num > 3)
4566 {
4567 i.rex_encoding = FALSE;
4568 break;
4569 }
4570
4571 if (i.rex_encoding)
4572 i.rex = REX_OPCODE;
4573 }
4574
4575 if (i.rex != 0)
4576 add_prefix (REX_OPCODE | i.rex);
4577
4578 /* We are ready to output the insn. */
4579 output_insn ();
4580 }
4581
4582 static char *
4583 parse_insn (char *line, char *mnemonic)
4584 {
4585 char *l = line;
4586 char *token_start = l;
4587 char *mnem_p;
4588 int supported;
4589 const insn_template *t;
4590 char *dot_p = NULL;
4591
4592 while (1)
4593 {
4594 mnem_p = mnemonic;
4595 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4596 {
4597 if (*mnem_p == '.')
4598 dot_p = mnem_p;
4599 mnem_p++;
4600 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4601 {
4602 as_bad (_("no such instruction: `%s'"), token_start);
4603 return NULL;
4604 }
4605 l++;
4606 }
4607 if (!is_space_char (*l)
4608 && *l != END_OF_INSN
4609 && (intel_syntax
4610 || (*l != PREFIX_SEPARATOR
4611 && *l != ',')))
4612 {
4613 as_bad (_("invalid character %s in mnemonic"),
4614 output_invalid (*l));
4615 return NULL;
4616 }
4617 if (token_start == l)
4618 {
4619 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4620 as_bad (_("expecting prefix; got nothing"));
4621 else
4622 as_bad (_("expecting mnemonic; got nothing"));
4623 return NULL;
4624 }
4625
4626 /* Look up instruction (or prefix) via hash table. */
4627 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4628
4629 if (*l != END_OF_INSN
4630 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4631 && current_templates
4632 && current_templates->start->opcode_modifier.isprefix)
4633 {
4634 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4635 {
4636 as_bad ((flag_code != CODE_64BIT
4637 ? _("`%s' is only supported in 64-bit mode")
4638 : _("`%s' is not supported in 64-bit mode")),
4639 current_templates->start->name);
4640 return NULL;
4641 }
4642 /* If we are in 16-bit mode, do not allow addr16 or data16.
4643 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4644 if ((current_templates->start->opcode_modifier.size == SIZE16
4645 || current_templates->start->opcode_modifier.size == SIZE32)
4646 && flag_code != CODE_64BIT
4647 && ((current_templates->start->opcode_modifier.size == SIZE32)
4648 ^ (flag_code == CODE_16BIT)))
4649 {
4650 as_bad (_("redundant %s prefix"),
4651 current_templates->start->name);
4652 return NULL;
4653 }
4654 if (current_templates->start->opcode_length == 0)
4655 {
4656 /* Handle pseudo prefixes. */
4657 switch (current_templates->start->base_opcode)
4658 {
4659 case 0x0:
4660 /* {disp8} */
4661 i.disp_encoding = disp_encoding_8bit;
4662 break;
4663 case 0x1:
4664 /* {disp32} */
4665 i.disp_encoding = disp_encoding_32bit;
4666 break;
4667 case 0x2:
4668 /* {load} */
4669 i.dir_encoding = dir_encoding_load;
4670 break;
4671 case 0x3:
4672 /* {store} */
4673 i.dir_encoding = dir_encoding_store;
4674 break;
4675 case 0x4:
4676 /* {vex2} */
4677 i.vec_encoding = vex_encoding_vex2;
4678 break;
4679 case 0x5:
4680 /* {vex3} */
4681 i.vec_encoding = vex_encoding_vex3;
4682 break;
4683 case 0x6:
4684 /* {evex} */
4685 i.vec_encoding = vex_encoding_evex;
4686 break;
4687 case 0x7:
4688 /* {rex} */
4689 i.rex_encoding = TRUE;
4690 break;
4691 case 0x8:
4692 /* {nooptimize} */
4693 i.no_optimize = TRUE;
4694 break;
4695 default:
4696 abort ();
4697 }
4698 }
4699 else
4700 {
4701 /* Add prefix, checking for repeated prefixes. */
4702 switch (add_prefix (current_templates->start->base_opcode))
4703 {
4704 case PREFIX_EXIST:
4705 return NULL;
4706 case PREFIX_DS:
4707 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4708 i.notrack_prefix = current_templates->start->name;
4709 break;
4710 case PREFIX_REP:
4711 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4712 i.hle_prefix = current_templates->start->name;
4713 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4714 i.bnd_prefix = current_templates->start->name;
4715 else
4716 i.rep_prefix = current_templates->start->name;
4717 break;
4718 default:
4719 break;
4720 }
4721 }
4722 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4723 token_start = ++l;
4724 }
4725 else
4726 break;
4727 }
4728
4729 if (!current_templates)
4730 {
4731 /* Deprecated functionality (new code should use pseudo-prefixes instead):
4732 Check if we should swap operand or force 32bit displacement in
4733 encoding. */
4734 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4735 i.dir_encoding = dir_encoding_swap;
4736 else if (mnem_p - 3 == dot_p
4737 && dot_p[1] == 'd'
4738 && dot_p[2] == '8')
4739 i.disp_encoding = disp_encoding_8bit;
4740 else if (mnem_p - 4 == dot_p
4741 && dot_p[1] == 'd'
4742 && dot_p[2] == '3'
4743 && dot_p[3] == '2')
4744 i.disp_encoding = disp_encoding_32bit;
4745 else
4746 goto check_suffix;
4747 mnem_p = dot_p;
4748 *dot_p = '\0';
4749 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4750 }
4751
4752 if (!current_templates)
4753 {
4754 check_suffix:
4755 if (mnem_p > mnemonic)
4756 {
4757 /* See if we can get a match by trimming off a suffix. */
4758 switch (mnem_p[-1])
4759 {
4760 case WORD_MNEM_SUFFIX:
4761 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4762 i.suffix = SHORT_MNEM_SUFFIX;
4763 else
4764 /* Fall through. */
4765 case BYTE_MNEM_SUFFIX:
4766 case QWORD_MNEM_SUFFIX:
4767 i.suffix = mnem_p[-1];
4768 mnem_p[-1] = '\0';
4769 current_templates = (const templates *) hash_find (op_hash,
4770 mnemonic);
4771 break;
4772 case SHORT_MNEM_SUFFIX:
4773 case LONG_MNEM_SUFFIX:
4774 if (!intel_syntax)
4775 {
4776 i.suffix = mnem_p[-1];
4777 mnem_p[-1] = '\0';
4778 current_templates = (const templates *) hash_find (op_hash,
4779 mnemonic);
4780 }
4781 break;
4782
4783 /* Intel Syntax. */
4784 case 'd':
4785 if (intel_syntax)
4786 {
4787 if (intel_float_operand (mnemonic) == 1)
4788 i.suffix = SHORT_MNEM_SUFFIX;
4789 else
4790 i.suffix = LONG_MNEM_SUFFIX;
4791 mnem_p[-1] = '\0';
4792 current_templates = (const templates *) hash_find (op_hash,
4793 mnemonic);
4794 }
4795 break;
4796 }
4797 }
4798
4799 if (!current_templates)
4800 {
4801 as_bad (_("no such instruction: `%s'"), token_start);
4802 return NULL;
4803 }
4804 }
4805
4806 if (current_templates->start->opcode_modifier.jump
4807 || current_templates->start->opcode_modifier.jumpbyte)
4808 {
4809 /* Check for a branch hint. We allow ",pt" and ",pn" for
4810 predict taken and predict not taken respectively.
4811 I'm not sure that branch hints actually do anything on loop
4812 and jcxz insns (JumpByte) for current Pentium4 chips. They
4813 may work in the future and it doesn't hurt to accept them
4814 now. */
4815 if (l[0] == ',' && l[1] == 'p')
4816 {
4817 if (l[2] == 't')
4818 {
4819 if (!add_prefix (DS_PREFIX_OPCODE))
4820 return NULL;
4821 l += 3;
4822 }
4823 else if (l[2] == 'n')
4824 {
4825 if (!add_prefix (CS_PREFIX_OPCODE))
4826 return NULL;
4827 l += 3;
4828 }
4829 }
4830 }
4831 /* Any other comma loses. */
4832 if (*l == ',')
4833 {
4834 as_bad (_("invalid character %s in mnemonic"),
4835 output_invalid (*l));
4836 return NULL;
4837 }
4838
4839 /* Check if instruction is supported on specified architecture. */
4840 supported = 0;
4841 for (t = current_templates->start; t < current_templates->end; ++t)
4842 {
4843 supported |= cpu_flags_match (t);
4844 if (supported == CPU_FLAGS_PERFECT_MATCH)
4845 {
4846 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4847 as_warn (_("use .code16 to ensure correct addressing mode"));
4848
4849 return l;
4850 }
4851 }
4852
4853 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4854 as_bad (flag_code == CODE_64BIT
4855 ? _("`%s' is not supported in 64-bit mode")
4856 : _("`%s' is only supported in 64-bit mode"),
4857 current_templates->start->name);
4858 else
4859 as_bad (_("`%s' is not supported on `%s%s'"),
4860 current_templates->start->name,
4861 cpu_arch_name ? cpu_arch_name : default_arch,
4862 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4863
4864 return NULL;
4865 }
4866
4867 static char *
4868 parse_operands (char *l, const char *mnemonic)
4869 {
4870 char *token_start;
4871
4872 /* 1 if operand is pending after ','. */
4873 unsigned int expecting_operand = 0;
4874
4875 /* Non-zero if operand parens not balanced. */
4876 unsigned int paren_not_balanced;
4877
4878 while (*l != END_OF_INSN)
4879 {
4880 /* Skip optional white space before operand. */
4881 if (is_space_char (*l))
4882 ++l;
4883 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4884 {
4885 as_bad (_("invalid character %s before operand %d"),
4886 output_invalid (*l),
4887 i.operands + 1);
4888 return NULL;
4889 }
4890 token_start = l; /* After white space. */
4891 paren_not_balanced = 0;
4892 while (paren_not_balanced || *l != ',')
4893 {
4894 if (*l == END_OF_INSN)
4895 {
4896 if (paren_not_balanced)
4897 {
4898 if (!intel_syntax)
4899 as_bad (_("unbalanced parenthesis in operand %d."),
4900 i.operands + 1);
4901 else
4902 as_bad (_("unbalanced brackets in operand %d."),
4903 i.operands + 1);
4904 return NULL;
4905 }
4906 else
4907 break; /* we are done */
4908 }
4909 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4910 {
4911 as_bad (_("invalid character %s in operand %d"),
4912 output_invalid (*l),
4913 i.operands + 1);
4914 return NULL;
4915 }
4916 if (!intel_syntax)
4917 {
4918 if (*l == '(')
4919 ++paren_not_balanced;
4920 if (*l == ')')
4921 --paren_not_balanced;
4922 }
4923 else
4924 {
4925 if (*l == '[')
4926 ++paren_not_balanced;
4927 if (*l == ']')
4928 --paren_not_balanced;
4929 }
4930 l++;
4931 }
4932 if (l != token_start)
4933 { /* Yes, we've read in another operand. */
4934 unsigned int operand_ok;
4935 this_operand = i.operands++;
4936 if (i.operands > MAX_OPERANDS)
4937 {
4938 as_bad (_("spurious operands; (%d operands/instruction max)"),
4939 MAX_OPERANDS);
4940 return NULL;
4941 }
4942 i.types[this_operand].bitfield.unspecified = 1;
4943 /* Now parse operand adding info to 'i' as we go along. */
4944 END_STRING_AND_SAVE (l);
4945
4946 if (i.mem_operands > 1)
4947 {
4948 as_bad (_("too many memory references for `%s'"),
4949 mnemonic);
4950 return 0;
4951 }
4952
4953 if (intel_syntax)
4954 operand_ok =
4955 i386_intel_operand (token_start,
4956 intel_float_operand (mnemonic));
4957 else
4958 operand_ok = i386_att_operand (token_start);
4959
4960 RESTORE_END_STRING (l);
4961 if (!operand_ok)
4962 return NULL;
4963 }
4964 else
4965 {
4966 if (expecting_operand)
4967 {
4968 expecting_operand_after_comma:
4969 as_bad (_("expecting operand after ','; got nothing"));
4970 return NULL;
4971 }
4972 if (*l == ',')
4973 {
4974 as_bad (_("expecting operand before ','; got nothing"));
4975 return NULL;
4976 }
4977 }
4978
4979 /* Now *l must be either ',' or END_OF_INSN. */
4980 if (*l == ',')
4981 {
4982 if (*++l == END_OF_INSN)
4983 {
4984 /* Just skip it, if it's \n complain. */
4985 goto expecting_operand_after_comma;
4986 }
4987 expecting_operand = 1;
4988 }
4989 }
4990 return l;
4991 }
4992
4993 static void
4994 swap_2_operands (int xchg1, int xchg2)
4995 {
4996 union i386_op temp_op;
4997 i386_operand_type temp_type;
4998 unsigned int temp_flags;
4999 enum bfd_reloc_code_real temp_reloc;
5000
5001 temp_type = i.types[xchg2];
5002 i.types[xchg2] = i.types[xchg1];
5003 i.types[xchg1] = temp_type;
5004
5005 temp_flags = i.flags[xchg2];
5006 i.flags[xchg2] = i.flags[xchg1];
5007 i.flags[xchg1] = temp_flags;
5008
5009 temp_op = i.op[xchg2];
5010 i.op[xchg2] = i.op[xchg1];
5011 i.op[xchg1] = temp_op;
5012
5013 temp_reloc = i.reloc[xchg2];
5014 i.reloc[xchg2] = i.reloc[xchg1];
5015 i.reloc[xchg1] = temp_reloc;
5016
5017 if (i.mask)
5018 {
5019 if (i.mask->operand == xchg1)
5020 i.mask->operand = xchg2;
5021 else if (i.mask->operand == xchg2)
5022 i.mask->operand = xchg1;
5023 }
5024 if (i.broadcast)
5025 {
5026 if (i.broadcast->operand == xchg1)
5027 i.broadcast->operand = xchg2;
5028 else if (i.broadcast->operand == xchg2)
5029 i.broadcast->operand = xchg1;
5030 }
5031 if (i.rounding)
5032 {
5033 if (i.rounding->operand == xchg1)
5034 i.rounding->operand = xchg2;
5035 else if (i.rounding->operand == xchg2)
5036 i.rounding->operand = xchg1;
5037 }
5038 }
5039
5040 static void
5041 swap_operands (void)
5042 {
5043 switch (i.operands)
5044 {
5045 case 5:
5046 case 4:
5047 swap_2_operands (1, i.operands - 2);
5048 /* Fall through. */
5049 case 3:
5050 case 2:
5051 swap_2_operands (0, i.operands - 1);
5052 break;
5053 default:
5054 abort ();
5055 }
5056
5057 if (i.mem_operands == 2)
5058 {
5059 const seg_entry *temp_seg;
5060 temp_seg = i.seg[0];
5061 i.seg[0] = i.seg[1];
5062 i.seg[1] = temp_seg;
5063 }
5064 }
5065
5066 /* Try to ensure constant immediates are represented in the smallest
5067 opcode possible. */
5068 static void
5069 optimize_imm (void)
5070 {
5071 char guess_suffix = 0;
5072 int op;
5073
5074 if (i.suffix)
5075 guess_suffix = i.suffix;
5076 else if (i.reg_operands)
5077 {
5078 /* Figure out a suffix from the last register operand specified.
5079 We can't do this properly yet, ie. excluding InOutPortReg,
5080 but the following works for instructions with immediates.
5081 In any case, we can't set i.suffix yet. */
5082 for (op = i.operands; --op >= 0;)
5083 if (i.types[op].bitfield.class != Reg)
5084 continue;
5085 else if (i.types[op].bitfield.byte)
5086 {
5087 guess_suffix = BYTE_MNEM_SUFFIX;
5088 break;
5089 }
5090 else if (i.types[op].bitfield.word)
5091 {
5092 guess_suffix = WORD_MNEM_SUFFIX;
5093 break;
5094 }
5095 else if (i.types[op].bitfield.dword)
5096 {
5097 guess_suffix = LONG_MNEM_SUFFIX;
5098 break;
5099 }
5100 else if (i.types[op].bitfield.qword)
5101 {
5102 guess_suffix = QWORD_MNEM_SUFFIX;
5103 break;
5104 }
5105 }
5106 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5107 guess_suffix = WORD_MNEM_SUFFIX;
5108
5109 for (op = i.operands; --op >= 0;)
5110 if (operand_type_check (i.types[op], imm))
5111 {
5112 switch (i.op[op].imms->X_op)
5113 {
5114 case O_constant:
5115 /* If a suffix is given, this operand may be shortened. */
5116 switch (guess_suffix)
5117 {
5118 case LONG_MNEM_SUFFIX:
5119 i.types[op].bitfield.imm32 = 1;
5120 i.types[op].bitfield.imm64 = 1;
5121 break;
5122 case WORD_MNEM_SUFFIX:
5123 i.types[op].bitfield.imm16 = 1;
5124 i.types[op].bitfield.imm32 = 1;
5125 i.types[op].bitfield.imm32s = 1;
5126 i.types[op].bitfield.imm64 = 1;
5127 break;
5128 case BYTE_MNEM_SUFFIX:
5129 i.types[op].bitfield.imm8 = 1;
5130 i.types[op].bitfield.imm8s = 1;
5131 i.types[op].bitfield.imm16 = 1;
5132 i.types[op].bitfield.imm32 = 1;
5133 i.types[op].bitfield.imm32s = 1;
5134 i.types[op].bitfield.imm64 = 1;
5135 break;
5136 }
5137
5138 /* If this operand is at most 16 bits, convert it
5139 to a signed 16 bit number before trying to see
5140 whether it will fit in an even smaller size.
5141 This allows a 16-bit operand such as $0xffe0 to
5142 be recognised as within Imm8S range. */
5143 if ((i.types[op].bitfield.imm16)
5144 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5145 {
5146 i.op[op].imms->X_add_number =
5147 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5148 }
5149 #ifdef BFD64
5150 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5151 if ((i.types[op].bitfield.imm32)
5152 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5153 == 0))
5154 {
5155 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5156 ^ ((offsetT) 1 << 31))
5157 - ((offsetT) 1 << 31));
5158 }
5159 #endif
5160 i.types[op]
5161 = operand_type_or (i.types[op],
5162 smallest_imm_type (i.op[op].imms->X_add_number));
5163
5164 /* We must avoid matching of Imm32 templates when 64bit
5165 only immediate is available. */
5166 if (guess_suffix == QWORD_MNEM_SUFFIX)
5167 i.types[op].bitfield.imm32 = 0;
5168 break;
5169
5170 case O_absent:
5171 case O_register:
5172 abort ();
5173
5174 /* Symbols and expressions. */
5175 default:
5176 /* Convert symbolic operand to proper sizes for matching, but don't
5177 prevent matching a set of insns that only supports sizes other
5178 than those matching the insn suffix. */
5179 {
5180 i386_operand_type mask, allowed;
5181 const insn_template *t;
5182
5183 operand_type_set (&mask, 0);
5184 operand_type_set (&allowed, 0);
5185
5186 for (t = current_templates->start;
5187 t < current_templates->end;
5188 ++t)
5189 {
5190 allowed = operand_type_or (allowed, t->operand_types[op]);
5191 allowed = operand_type_and (allowed, anyimm);
5192 }
5193 switch (guess_suffix)
5194 {
5195 case QWORD_MNEM_SUFFIX:
5196 mask.bitfield.imm64 = 1;
5197 mask.bitfield.imm32s = 1;
5198 break;
5199 case LONG_MNEM_SUFFIX:
5200 mask.bitfield.imm32 = 1;
5201 break;
5202 case WORD_MNEM_SUFFIX:
5203 mask.bitfield.imm16 = 1;
5204 break;
5205 case BYTE_MNEM_SUFFIX:
5206 mask.bitfield.imm8 = 1;
5207 break;
5208 default:
5209 break;
5210 }
5211 allowed = operand_type_and (mask, allowed);
5212 if (!operand_type_all_zero (&allowed))
5213 i.types[op] = operand_type_and (i.types[op], mask);
5214 }
5215 break;
5216 }
5217 }
5218 }
5219
5220 /* Try to use the smallest displacement type too. */
5221 static void
5222 optimize_disp (void)
5223 {
5224 int op;
5225
5226 for (op = i.operands; --op >= 0;)
5227 if (operand_type_check (i.types[op], disp))
5228 {
5229 if (i.op[op].disps->X_op == O_constant)
5230 {
5231 offsetT op_disp = i.op[op].disps->X_add_number;
5232
5233 if (i.types[op].bitfield.disp16
5234 && (op_disp & ~(offsetT) 0xffff) == 0)
5235 {
5236 /* If this operand is at most 16 bits, convert
5237 to a signed 16 bit number and don't use 64bit
5238 displacement. */
5239 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5240 i.types[op].bitfield.disp64 = 0;
5241 }
5242 #ifdef BFD64
5243 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5244 if (i.types[op].bitfield.disp32
5245 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5246 {
5247 /* If this operand is at most 32 bits, convert
5248 to a signed 32 bit number and don't use 64bit
5249 displacement. */
5250 op_disp &= (((offsetT) 2 << 31) - 1);
5251 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5252 i.types[op].bitfield.disp64 = 0;
5253 }
5254 #endif
5255 if (!op_disp && i.types[op].bitfield.baseindex)
5256 {
5257 i.types[op].bitfield.disp8 = 0;
5258 i.types[op].bitfield.disp16 = 0;
5259 i.types[op].bitfield.disp32 = 0;
5260 i.types[op].bitfield.disp32s = 0;
5261 i.types[op].bitfield.disp64 = 0;
5262 i.op[op].disps = 0;
5263 i.disp_operands--;
5264 }
5265 else if (flag_code == CODE_64BIT)
5266 {
5267 if (fits_in_signed_long (op_disp))
5268 {
5269 i.types[op].bitfield.disp64 = 0;
5270 i.types[op].bitfield.disp32s = 1;
5271 }
5272 if (i.prefix[ADDR_PREFIX]
5273 && fits_in_unsigned_long (op_disp))
5274 i.types[op].bitfield.disp32 = 1;
5275 }
5276 if ((i.types[op].bitfield.disp32
5277 || i.types[op].bitfield.disp32s
5278 || i.types[op].bitfield.disp16)
5279 && fits_in_disp8 (op_disp))
5280 i.types[op].bitfield.disp8 = 1;
5281 }
5282 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5283 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5284 {
5285 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5286 i.op[op].disps, 0, i.reloc[op]);
5287 i.types[op].bitfield.disp8 = 0;
5288 i.types[op].bitfield.disp16 = 0;
5289 i.types[op].bitfield.disp32 = 0;
5290 i.types[op].bitfield.disp32s = 0;
5291 i.types[op].bitfield.disp64 = 0;
5292 }
5293 else
5294 /* We only support 64bit displacement on constants. */
5295 i.types[op].bitfield.disp64 = 0;
5296 }
5297 }
5298
5299 /* Return 1 if there is a match in broadcast bytes between operand
5300 GIVEN and instruction template T. */
5301
5302 static INLINE int
5303 match_broadcast_size (const insn_template *t, unsigned int given)
5304 {
5305 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5306 && i.types[given].bitfield.byte)
5307 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5308 && i.types[given].bitfield.word)
5309 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5310 && i.types[given].bitfield.dword)
5311 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5312 && i.types[given].bitfield.qword));
5313 }
5314
5315 /* Check if operands are valid for the instruction. */
5316
5317 static int
5318 check_VecOperands (const insn_template *t)
5319 {
5320 unsigned int op;
5321 i386_cpu_flags cpu;
5322 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5323
5324 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5325 any one operand are implicity requiring AVX512VL support if the actual
5326 operand size is YMMword or XMMword. Since this function runs after
5327 template matching, there's no need to check for YMMword/XMMword in
5328 the template. */
5329 cpu = cpu_flags_and (t->cpu_flags, avx512);
5330 if (!cpu_flags_all_zero (&cpu)
5331 && !t->cpu_flags.bitfield.cpuavx512vl
5332 && !cpu_arch_flags.bitfield.cpuavx512vl)
5333 {
5334 for (op = 0; op < t->operands; ++op)
5335 {
5336 if (t->operand_types[op].bitfield.zmmword
5337 && (i.types[op].bitfield.ymmword
5338 || i.types[op].bitfield.xmmword))
5339 {
5340 i.error = unsupported;
5341 return 1;
5342 }
5343 }
5344 }
5345
5346 /* Without VSIB byte, we can't have a vector register for index. */
5347 if (!t->opcode_modifier.vecsib
5348 && i.index_reg
5349 && (i.index_reg->reg_type.bitfield.xmmword
5350 || i.index_reg->reg_type.bitfield.ymmword
5351 || i.index_reg->reg_type.bitfield.zmmword))
5352 {
5353 i.error = unsupported_vector_index_register;
5354 return 1;
5355 }
5356
5357 /* Check if default mask is allowed. */
5358 if (t->opcode_modifier.nodefmask
5359 && (!i.mask || i.mask->mask->reg_num == 0))
5360 {
5361 i.error = no_default_mask;
5362 return 1;
5363 }
5364
5365 /* For VSIB byte, we need a vector register for index, and all vector
5366 registers must be distinct. */
5367 if (t->opcode_modifier.vecsib)
5368 {
5369 if (!i.index_reg
5370 || !((t->opcode_modifier.vecsib == VecSIB128
5371 && i.index_reg->reg_type.bitfield.xmmword)
5372 || (t->opcode_modifier.vecsib == VecSIB256
5373 && i.index_reg->reg_type.bitfield.ymmword)
5374 || (t->opcode_modifier.vecsib == VecSIB512
5375 && i.index_reg->reg_type.bitfield.zmmword)))
5376 {
5377 i.error = invalid_vsib_address;
5378 return 1;
5379 }
5380
5381 gas_assert (i.reg_operands == 2 || i.mask);
5382 if (i.reg_operands == 2 && !i.mask)
5383 {
5384 gas_assert (i.types[0].bitfield.class == RegSIMD);
5385 gas_assert (i.types[0].bitfield.xmmword
5386 || i.types[0].bitfield.ymmword);
5387 gas_assert (i.types[2].bitfield.class == RegSIMD);
5388 gas_assert (i.types[2].bitfield.xmmword
5389 || i.types[2].bitfield.ymmword);
5390 if (operand_check == check_none)
5391 return 0;
5392 if (register_number (i.op[0].regs)
5393 != register_number (i.index_reg)
5394 && register_number (i.op[2].regs)
5395 != register_number (i.index_reg)
5396 && register_number (i.op[0].regs)
5397 != register_number (i.op[2].regs))
5398 return 0;
5399 if (operand_check == check_error)
5400 {
5401 i.error = invalid_vector_register_set;
5402 return 1;
5403 }
5404 as_warn (_("mask, index, and destination registers should be distinct"));
5405 }
5406 else if (i.reg_operands == 1 && i.mask)
5407 {
5408 if (i.types[1].bitfield.class == RegSIMD
5409 && (i.types[1].bitfield.xmmword
5410 || i.types[1].bitfield.ymmword
5411 || i.types[1].bitfield.zmmword)
5412 && (register_number (i.op[1].regs)
5413 == register_number (i.index_reg)))
5414 {
5415 if (operand_check == check_error)
5416 {
5417 i.error = invalid_vector_register_set;
5418 return 1;
5419 }
5420 if (operand_check != check_none)
5421 as_warn (_("index and destination registers should be distinct"));
5422 }
5423 }
5424 }
5425
5426 /* Check if broadcast is supported by the instruction and is applied
5427 to the memory operand. */
5428 if (i.broadcast)
5429 {
5430 i386_operand_type type, overlap;
5431
5432 /* Check if specified broadcast is supported in this instruction,
5433 and its broadcast bytes match the memory operand. */
5434 op = i.broadcast->operand;
5435 if (!t->opcode_modifier.broadcast
5436 || !(i.flags[op] & Operand_Mem)
5437 || (!i.types[op].bitfield.unspecified
5438 && !match_broadcast_size (t, op)))
5439 {
5440 bad_broadcast:
5441 i.error = unsupported_broadcast;
5442 return 1;
5443 }
5444
5445 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5446 * i.broadcast->type);
5447 operand_type_set (&type, 0);
5448 switch (i.broadcast->bytes)
5449 {
5450 case 2:
5451 type.bitfield.word = 1;
5452 break;
5453 case 4:
5454 type.bitfield.dword = 1;
5455 break;
5456 case 8:
5457 type.bitfield.qword = 1;
5458 break;
5459 case 16:
5460 type.bitfield.xmmword = 1;
5461 break;
5462 case 32:
5463 type.bitfield.ymmword = 1;
5464 break;
5465 case 64:
5466 type.bitfield.zmmword = 1;
5467 break;
5468 default:
5469 goto bad_broadcast;
5470 }
5471
5472 overlap = operand_type_and (type, t->operand_types[op]);
5473 if (operand_type_all_zero (&overlap))
5474 goto bad_broadcast;
5475
5476 if (t->opcode_modifier.checkregsize)
5477 {
5478 unsigned int j;
5479
5480 type.bitfield.baseindex = 1;
5481 for (j = 0; j < i.operands; ++j)
5482 {
5483 if (j != op
5484 && !operand_type_register_match(i.types[j],
5485 t->operand_types[j],
5486 type,
5487 t->operand_types[op]))
5488 goto bad_broadcast;
5489 }
5490 }
5491 }
5492 /* If broadcast is supported in this instruction, we need to check if
5493 operand of one-element size isn't specified without broadcast. */
5494 else if (t->opcode_modifier.broadcast && i.mem_operands)
5495 {
5496 /* Find memory operand. */
5497 for (op = 0; op < i.operands; op++)
5498 if (i.flags[op] & Operand_Mem)
5499 break;
5500 gas_assert (op < i.operands);
5501 /* Check size of the memory operand. */
5502 if (match_broadcast_size (t, op))
5503 {
5504 i.error = broadcast_needed;
5505 return 1;
5506 }
5507 }
5508 else
5509 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5510
5511 /* Check if requested masking is supported. */
5512 if (i.mask)
5513 {
5514 switch (t->opcode_modifier.masking)
5515 {
5516 case BOTH_MASKING:
5517 break;
5518 case MERGING_MASKING:
5519 if (i.mask->zeroing)
5520 {
5521 case 0:
5522 i.error = unsupported_masking;
5523 return 1;
5524 }
5525 break;
5526 case DYNAMIC_MASKING:
5527 /* Memory destinations allow only merging masking. */
5528 if (i.mask->zeroing && i.mem_operands)
5529 {
5530 /* Find memory operand. */
5531 for (op = 0; op < i.operands; op++)
5532 if (i.flags[op] & Operand_Mem)
5533 break;
5534 gas_assert (op < i.operands);
5535 if (op == i.operands - 1)
5536 {
5537 i.error = unsupported_masking;
5538 return 1;
5539 }
5540 }
5541 break;
5542 default:
5543 abort ();
5544 }
5545 }
5546
5547 /* Check if masking is applied to dest operand. */
5548 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5549 {
5550 i.error = mask_not_on_destination;
5551 return 1;
5552 }
5553
5554 /* Check RC/SAE. */
5555 if (i.rounding)
5556 {
5557 if (!t->opcode_modifier.sae
5558 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
5559 {
5560 i.error = unsupported_rc_sae;
5561 return 1;
5562 }
5563 /* If the instruction has several immediate operands and one of
5564 them is rounding, the rounding operand should be the last
5565 immediate operand. */
5566 if (i.imm_operands > 1
5567 && i.rounding->operand != (int) (i.imm_operands - 1))
5568 {
5569 i.error = rc_sae_operand_not_last_imm;
5570 return 1;
5571 }
5572 }
5573
5574 /* Check vector Disp8 operand. */
5575 if (t->opcode_modifier.disp8memshift
5576 && i.disp_encoding != disp_encoding_32bit)
5577 {
5578 if (i.broadcast)
5579 i.memshift = t->opcode_modifier.broadcast - 1;
5580 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5581 i.memshift = t->opcode_modifier.disp8memshift;
5582 else
5583 {
5584 const i386_operand_type *type = NULL;
5585
5586 i.memshift = 0;
5587 for (op = 0; op < i.operands; op++)
5588 if (i.flags[op] & Operand_Mem)
5589 {
5590 if (t->opcode_modifier.evex == EVEXLIG)
5591 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5592 else if (t->operand_types[op].bitfield.xmmword
5593 + t->operand_types[op].bitfield.ymmword
5594 + t->operand_types[op].bitfield.zmmword <= 1)
5595 type = &t->operand_types[op];
5596 else if (!i.types[op].bitfield.unspecified)
5597 type = &i.types[op];
5598 }
5599 else if (i.types[op].bitfield.class == RegSIMD
5600 && t->opcode_modifier.evex != EVEXLIG)
5601 {
5602 if (i.types[op].bitfield.zmmword)
5603 i.memshift = 6;
5604 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5605 i.memshift = 5;
5606 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5607 i.memshift = 4;
5608 }
5609
5610 if (type)
5611 {
5612 if (type->bitfield.zmmword)
5613 i.memshift = 6;
5614 else if (type->bitfield.ymmword)
5615 i.memshift = 5;
5616 else if (type->bitfield.xmmword)
5617 i.memshift = 4;
5618 }
5619
5620 /* For the check in fits_in_disp8(). */
5621 if (i.memshift == 0)
5622 i.memshift = -1;
5623 }
5624
5625 for (op = 0; op < i.operands; op++)
5626 if (operand_type_check (i.types[op], disp)
5627 && i.op[op].disps->X_op == O_constant)
5628 {
5629 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5630 {
5631 i.types[op].bitfield.disp8 = 1;
5632 return 0;
5633 }
5634 i.types[op].bitfield.disp8 = 0;
5635 }
5636 }
5637
5638 i.memshift = 0;
5639
5640 return 0;
5641 }
5642
5643 /* Check if operands are valid for the instruction. Update VEX
5644 operand types. */
5645
5646 static int
5647 VEX_check_operands (const insn_template *t)
5648 {
5649 if (i.vec_encoding == vex_encoding_evex)
5650 {
5651 /* This instruction must be encoded with EVEX prefix. */
5652 if (!is_evex_encoding (t))
5653 {
5654 i.error = unsupported;
5655 return 1;
5656 }
5657 return 0;
5658 }
5659
5660 if (!t->opcode_modifier.vex)
5661 {
5662 /* This instruction template doesn't have VEX prefix. */
5663 if (i.vec_encoding != vex_encoding_default)
5664 {
5665 i.error = unsupported;
5666 return 1;
5667 }
5668 return 0;
5669 }
5670
5671 /* Check the special Imm4 cases; must be the first operand. */
5672 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
5673 {
5674 if (i.op[0].imms->X_op != O_constant
5675 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5676 {
5677 i.error = bad_imm4;
5678 return 1;
5679 }
5680
5681 /* Turn off Imm<N> so that update_imm won't complain. */
5682 operand_type_set (&i.types[0], 0);
5683 }
5684
5685 return 0;
5686 }
5687
5688 static const insn_template *
5689 match_template (char mnem_suffix)
5690 {
5691 /* Points to template once we've found it. */
5692 const insn_template *t;
5693 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5694 i386_operand_type overlap4;
5695 unsigned int found_reverse_match;
5696 i386_opcode_modifier suffix_check;
5697 i386_operand_type operand_types [MAX_OPERANDS];
5698 int addr_prefix_disp;
5699 unsigned int j;
5700 unsigned int found_cpu_match, size_match;
5701 unsigned int check_register;
5702 enum i386_error specific_error = 0;
5703
5704 #if MAX_OPERANDS != 5
5705 # error "MAX_OPERANDS must be 5."
5706 #endif
5707
5708 found_reverse_match = 0;
5709 addr_prefix_disp = -1;
5710
5711 /* Prepare for mnemonic suffix check. */
5712 memset (&suffix_check, 0, sizeof (suffix_check));
5713 switch (mnem_suffix)
5714 {
5715 case BYTE_MNEM_SUFFIX:
5716 suffix_check.no_bsuf = 1;
5717 break;
5718 case WORD_MNEM_SUFFIX:
5719 suffix_check.no_wsuf = 1;
5720 break;
5721 case SHORT_MNEM_SUFFIX:
5722 suffix_check.no_ssuf = 1;
5723 break;
5724 case LONG_MNEM_SUFFIX:
5725 suffix_check.no_lsuf = 1;
5726 break;
5727 case QWORD_MNEM_SUFFIX:
5728 suffix_check.no_qsuf = 1;
5729 break;
5730 default:
5731 /* NB: In Intel syntax, normally we can check for memory operand
5732 size when there is no mnemonic suffix. But jmp and call have
5733 2 different encodings with Dword memory operand size, one with
5734 No_ldSuf and the other without. i.suffix is set to
5735 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
5736 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5737 suffix_check.no_ldsuf = 1;
5738 }
5739
5740 /* Must have right number of operands. */
5741 i.error = number_of_operands_mismatch;
5742
5743 for (t = current_templates->start; t < current_templates->end; t++)
5744 {
5745 addr_prefix_disp = -1;
5746 found_reverse_match = 0;
5747
5748 if (i.operands != t->operands)
5749 continue;
5750
5751 /* Check processor support. */
5752 i.error = unsupported;
5753 found_cpu_match = (cpu_flags_match (t)
5754 == CPU_FLAGS_PERFECT_MATCH);
5755 if (!found_cpu_match)
5756 continue;
5757
5758 /* Check AT&T mnemonic. */
5759 i.error = unsupported_with_intel_mnemonic;
5760 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5761 continue;
5762
5763 /* Check AT&T/Intel syntax and Intel64/AMD64 ISA. */
5764 i.error = unsupported_syntax;
5765 if ((intel_syntax && t->opcode_modifier.attsyntax)
5766 || (!intel_syntax && t->opcode_modifier.intelsyntax)
5767 || (intel64 && t->opcode_modifier.amd64)
5768 || (!intel64 && t->opcode_modifier.intel64))
5769 continue;
5770
5771 /* Check the suffix. */
5772 i.error = invalid_instruction_suffix;
5773 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5774 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5775 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5776 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5777 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5778 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
5779 continue;
5780
5781 size_match = operand_size_match (t);
5782 if (!size_match)
5783 continue;
5784
5785 for (j = 0; j < MAX_OPERANDS; j++)
5786 operand_types[j] = t->operand_types[j];
5787
5788 /* In general, don't allow 64-bit operands in 32-bit mode. */
5789 if (i.suffix == QWORD_MNEM_SUFFIX
5790 && flag_code != CODE_64BIT
5791 && (intel_syntax
5792 ? (!t->opcode_modifier.ignoresize
5793 && !t->opcode_modifier.broadcast
5794 && !intel_float_operand (t->name))
5795 : intel_float_operand (t->name) != 2)
5796 && ((operand_types[0].bitfield.class != RegMMX
5797 && operand_types[0].bitfield.class != RegSIMD)
5798 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5799 && operand_types[t->operands > 1].bitfield.class != RegSIMD))
5800 && (t->base_opcode != 0x0fc7
5801 || t->extension_opcode != 1 /* cmpxchg8b */))
5802 continue;
5803
5804 /* In general, don't allow 32-bit operands on pre-386. */
5805 else if (i.suffix == LONG_MNEM_SUFFIX
5806 && !cpu_arch_flags.bitfield.cpui386
5807 && (intel_syntax
5808 ? (!t->opcode_modifier.ignoresize
5809 && !intel_float_operand (t->name))
5810 : intel_float_operand (t->name) != 2)
5811 && ((operand_types[0].bitfield.class != RegMMX
5812 && operand_types[0].bitfield.class != RegSIMD)
5813 || (operand_types[t->operands > 1].bitfield.class != RegMMX
5814 && operand_types[t->operands > 1].bitfield.class
5815 != RegSIMD)))
5816 continue;
5817
5818 /* Do not verify operands when there are none. */
5819 else
5820 {
5821 if (!t->operands)
5822 /* We've found a match; break out of loop. */
5823 break;
5824 }
5825
5826 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
5827 into Disp32/Disp16/Disp32 operand. */
5828 if (i.prefix[ADDR_PREFIX] != 0)
5829 {
5830 /* There should be only one Disp operand. */
5831 switch (flag_code)
5832 {
5833 case CODE_16BIT:
5834 for (j = 0; j < MAX_OPERANDS; j++)
5835 {
5836 if (operand_types[j].bitfield.disp16)
5837 {
5838 addr_prefix_disp = j;
5839 operand_types[j].bitfield.disp32 = 1;
5840 operand_types[j].bitfield.disp16 = 0;
5841 break;
5842 }
5843 }
5844 break;
5845 case CODE_32BIT:
5846 for (j = 0; j < MAX_OPERANDS; j++)
5847 {
5848 if (operand_types[j].bitfield.disp32)
5849 {
5850 addr_prefix_disp = j;
5851 operand_types[j].bitfield.disp32 = 0;
5852 operand_types[j].bitfield.disp16 = 1;
5853 break;
5854 }
5855 }
5856 break;
5857 case CODE_64BIT:
5858 for (j = 0; j < MAX_OPERANDS; j++)
5859 {
5860 if (operand_types[j].bitfield.disp64)
5861 {
5862 addr_prefix_disp = j;
5863 operand_types[j].bitfield.disp64 = 0;
5864 operand_types[j].bitfield.disp32 = 1;
5865 break;
5866 }
5867 }
5868 break;
5869 }
5870 }
5871
5872 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5873 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5874 continue;
5875
5876 /* We check register size if needed. */
5877 if (t->opcode_modifier.checkregsize)
5878 {
5879 check_register = (1 << t->operands) - 1;
5880 if (i.broadcast)
5881 check_register &= ~(1 << i.broadcast->operand);
5882 }
5883 else
5884 check_register = 0;
5885
5886 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5887 switch (t->operands)
5888 {
5889 case 1:
5890 if (!operand_type_match (overlap0, i.types[0]))
5891 continue;
5892 break;
5893 case 2:
5894 /* xchg %eax, %eax is a special case. It is an alias for nop
5895 only in 32bit mode and we can use opcode 0x90. In 64bit
5896 mode, we can't use 0x90 for xchg %eax, %eax since it should
5897 zero-extend %eax to %rax. */
5898 if (flag_code == CODE_64BIT
5899 && t->base_opcode == 0x90
5900 && i.types[0].bitfield.acc && i.types[0].bitfield.dword
5901 && i.types[1].bitfield.acc && i.types[1].bitfield.dword)
5902 continue;
5903 /* xrelease mov %eax, <disp> is another special case. It must not
5904 match the accumulator-only encoding of mov. */
5905 if (flag_code != CODE_64BIT
5906 && i.hle_prefix
5907 && t->base_opcode == 0xa0
5908 && i.types[0].bitfield.acc
5909 && (i.flags[1] & Operand_Mem))
5910 continue;
5911 /* Fall through. */
5912
5913 case 3:
5914 if (!(size_match & MATCH_STRAIGHT))
5915 goto check_reverse;
5916 /* Reverse direction of operands if swapping is possible in the first
5917 place (operands need to be symmetric) and
5918 - the load form is requested, and the template is a store form,
5919 - the store form is requested, and the template is a load form,
5920 - the non-default (swapped) form is requested. */
5921 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
5922 if (t->opcode_modifier.d && i.reg_operands == i.operands
5923 && !operand_type_all_zero (&overlap1))
5924 switch (i.dir_encoding)
5925 {
5926 case dir_encoding_load:
5927 if (operand_type_check (operand_types[i.operands - 1], anymem)
5928 || t->opcode_modifier.regmem)
5929 goto check_reverse;
5930 break;
5931
5932 case dir_encoding_store:
5933 if (!operand_type_check (operand_types[i.operands - 1], anymem)
5934 && !t->opcode_modifier.regmem)
5935 goto check_reverse;
5936 break;
5937
5938 case dir_encoding_swap:
5939 goto check_reverse;
5940
5941 case dir_encoding_default:
5942 break;
5943 }
5944 /* If we want store form, we skip the current load. */
5945 if ((i.dir_encoding == dir_encoding_store
5946 || i.dir_encoding == dir_encoding_swap)
5947 && i.mem_operands == 0
5948 && t->opcode_modifier.load)
5949 continue;
5950 /* Fall through. */
5951 case 4:
5952 case 5:
5953 overlap1 = operand_type_and (i.types[1], operand_types[1]);
5954 if (!operand_type_match (overlap0, i.types[0])
5955 || !operand_type_match (overlap1, i.types[1])
5956 || ((check_register & 3) == 3
5957 && !operand_type_register_match (i.types[0],
5958 operand_types[0],
5959 i.types[1],
5960 operand_types[1])))
5961 {
5962 /* Check if other direction is valid ... */
5963 if (!t->opcode_modifier.d)
5964 continue;
5965
5966 check_reverse:
5967 if (!(size_match & MATCH_REVERSE))
5968 continue;
5969 /* Try reversing direction of operands. */
5970 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
5971 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
5972 if (!operand_type_match (overlap0, i.types[0])
5973 || !operand_type_match (overlap1, i.types[i.operands - 1])
5974 || (check_register
5975 && !operand_type_register_match (i.types[0],
5976 operand_types[i.operands - 1],
5977 i.types[i.operands - 1],
5978 operand_types[0])))
5979 {
5980 /* Does not match either direction. */
5981 continue;
5982 }
5983 /* found_reverse_match holds which of D or FloatR
5984 we've found. */
5985 if (!t->opcode_modifier.d)
5986 found_reverse_match = 0;
5987 else if (operand_types[0].bitfield.tbyte)
5988 found_reverse_match = Opcode_FloatD;
5989 else if (operand_types[0].bitfield.xmmword
5990 || operand_types[i.operands - 1].bitfield.xmmword
5991 || operand_types[0].bitfield.class == RegMMX
5992 || operand_types[i.operands - 1].bitfield.class == RegMMX
5993 || is_any_vex_encoding(t))
5994 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
5995 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
5996 else
5997 found_reverse_match = Opcode_D;
5998 if (t->opcode_modifier.floatr)
5999 found_reverse_match |= Opcode_FloatR;
6000 }
6001 else
6002 {
6003 /* Found a forward 2 operand match here. */
6004 switch (t->operands)
6005 {
6006 case 5:
6007 overlap4 = operand_type_and (i.types[4],
6008 operand_types[4]);
6009 /* Fall through. */
6010 case 4:
6011 overlap3 = operand_type_and (i.types[3],
6012 operand_types[3]);
6013 /* Fall through. */
6014 case 3:
6015 overlap2 = operand_type_and (i.types[2],
6016 operand_types[2]);
6017 break;
6018 }
6019
6020 switch (t->operands)
6021 {
6022 case 5:
6023 if (!operand_type_match (overlap4, i.types[4])
6024 || !operand_type_register_match (i.types[3],
6025 operand_types[3],
6026 i.types[4],
6027 operand_types[4]))
6028 continue;
6029 /* Fall through. */
6030 case 4:
6031 if (!operand_type_match (overlap3, i.types[3])
6032 || ((check_register & 0xa) == 0xa
6033 && !operand_type_register_match (i.types[1],
6034 operand_types[1],
6035 i.types[3],
6036 operand_types[3]))
6037 || ((check_register & 0xc) == 0xc
6038 && !operand_type_register_match (i.types[2],
6039 operand_types[2],
6040 i.types[3],
6041 operand_types[3])))
6042 continue;
6043 /* Fall through. */
6044 case 3:
6045 /* Here we make use of the fact that there are no
6046 reverse match 3 operand instructions. */
6047 if (!operand_type_match (overlap2, i.types[2])
6048 || ((check_register & 5) == 5
6049 && !operand_type_register_match (i.types[0],
6050 operand_types[0],
6051 i.types[2],
6052 operand_types[2]))
6053 || ((check_register & 6) == 6
6054 && !operand_type_register_match (i.types[1],
6055 operand_types[1],
6056 i.types[2],
6057 operand_types[2])))
6058 continue;
6059 break;
6060 }
6061 }
6062 /* Found either forward/reverse 2, 3 or 4 operand match here:
6063 slip through to break. */
6064 }
6065 if (!found_cpu_match)
6066 continue;
6067
6068 /* Check if vector and VEX operands are valid. */
6069 if (check_VecOperands (t) || VEX_check_operands (t))
6070 {
6071 specific_error = i.error;
6072 continue;
6073 }
6074
6075 /* We've found a match; break out of loop. */
6076 break;
6077 }
6078
6079 if (t == current_templates->end)
6080 {
6081 /* We found no match. */
6082 const char *err_msg;
6083 switch (specific_error ? specific_error : i.error)
6084 {
6085 default:
6086 abort ();
6087 case operand_size_mismatch:
6088 err_msg = _("operand size mismatch");
6089 break;
6090 case operand_type_mismatch:
6091 err_msg = _("operand type mismatch");
6092 break;
6093 case register_type_mismatch:
6094 err_msg = _("register type mismatch");
6095 break;
6096 case number_of_operands_mismatch:
6097 err_msg = _("number of operands mismatch");
6098 break;
6099 case invalid_instruction_suffix:
6100 err_msg = _("invalid instruction suffix");
6101 break;
6102 case bad_imm4:
6103 err_msg = _("constant doesn't fit in 4 bits");
6104 break;
6105 case unsupported_with_intel_mnemonic:
6106 err_msg = _("unsupported with Intel mnemonic");
6107 break;
6108 case unsupported_syntax:
6109 err_msg = _("unsupported syntax");
6110 break;
6111 case unsupported:
6112 as_bad (_("unsupported instruction `%s'"),
6113 current_templates->start->name);
6114 return NULL;
6115 case invalid_vsib_address:
6116 err_msg = _("invalid VSIB address");
6117 break;
6118 case invalid_vector_register_set:
6119 err_msg = _("mask, index, and destination registers must be distinct");
6120 break;
6121 case unsupported_vector_index_register:
6122 err_msg = _("unsupported vector index register");
6123 break;
6124 case unsupported_broadcast:
6125 err_msg = _("unsupported broadcast");
6126 break;
6127 case broadcast_needed:
6128 err_msg = _("broadcast is needed for operand of such type");
6129 break;
6130 case unsupported_masking:
6131 err_msg = _("unsupported masking");
6132 break;
6133 case mask_not_on_destination:
6134 err_msg = _("mask not on destination operand");
6135 break;
6136 case no_default_mask:
6137 err_msg = _("default mask isn't allowed");
6138 break;
6139 case unsupported_rc_sae:
6140 err_msg = _("unsupported static rounding/sae");
6141 break;
6142 case rc_sae_operand_not_last_imm:
6143 if (intel_syntax)
6144 err_msg = _("RC/SAE operand must precede immediate operands");
6145 else
6146 err_msg = _("RC/SAE operand must follow immediate operands");
6147 break;
6148 case invalid_register_operand:
6149 err_msg = _("invalid register operand");
6150 break;
6151 }
6152 as_bad (_("%s for `%s'"), err_msg,
6153 current_templates->start->name);
6154 return NULL;
6155 }
6156
6157 if (!quiet_warnings)
6158 {
6159 if (!intel_syntax
6160 && (i.types[0].bitfield.jumpabsolute
6161 != operand_types[0].bitfield.jumpabsolute))
6162 {
6163 as_warn (_("indirect %s without `*'"), t->name);
6164 }
6165
6166 if (t->opcode_modifier.isprefix
6167 && t->opcode_modifier.ignoresize)
6168 {
6169 /* Warn them that a data or address size prefix doesn't
6170 affect assembly of the next line of code. */
6171 as_warn (_("stand-alone `%s' prefix"), t->name);
6172 }
6173 }
6174
6175 /* Copy the template we found. */
6176 i.tm = *t;
6177
6178 if (addr_prefix_disp != -1)
6179 i.tm.operand_types[addr_prefix_disp]
6180 = operand_types[addr_prefix_disp];
6181
6182 if (found_reverse_match)
6183 {
6184 /* If we found a reverse match we must alter the opcode direction
6185 bit and clear/flip the regmem modifier one. found_reverse_match
6186 holds bits to change (different for int & float insns). */
6187
6188 i.tm.base_opcode ^= found_reverse_match;
6189
6190 i.tm.operand_types[0] = operand_types[i.operands - 1];
6191 i.tm.operand_types[i.operands - 1] = operand_types[0];
6192
6193 /* Certain SIMD insns have their load forms specified in the opcode
6194 table, and hence we need to _set_ RegMem instead of clearing it.
6195 We need to avoid setting the bit though on insns like KMOVW. */
6196 i.tm.opcode_modifier.regmem
6197 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6198 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6199 && !i.tm.opcode_modifier.regmem;
6200 }
6201
6202 return t;
6203 }
6204
6205 static int
6206 check_string (void)
6207 {
6208 unsigned int mem_op = i.flags[0] & Operand_Mem ? 0 : 1;
6209
6210 if (i.tm.operand_types[mem_op].bitfield.esseg)
6211 {
6212 if (i.seg[0] != NULL && i.seg[0] != &es)
6213 {
6214 as_bad (_("`%s' operand %d must use `%ses' segment"),
6215 i.tm.name,
6216 intel_syntax ? i.tm.operands - mem_op : mem_op + 1,
6217 register_prefix);
6218 return 0;
6219 }
6220 /* There's only ever one segment override allowed per instruction.
6221 This instruction possibly has a legal segment override on the
6222 second operand, so copy the segment to where non-string
6223 instructions store it, allowing common code. */
6224 i.seg[0] = i.seg[1];
6225 }
6226 else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
6227 {
6228 if (i.seg[1] != NULL && i.seg[1] != &es)
6229 {
6230 as_bad (_("`%s' operand %d must use `%ses' segment"),
6231 i.tm.name,
6232 intel_syntax ? i.tm.operands - mem_op - 1 : mem_op + 2,
6233 register_prefix);
6234 return 0;
6235 }
6236 }
6237 return 1;
6238 }
6239
6240 static int
6241 process_suffix (void)
6242 {
6243 /* If matched instruction specifies an explicit instruction mnemonic
6244 suffix, use it. */
6245 if (i.tm.opcode_modifier.size == SIZE16)
6246 i.suffix = WORD_MNEM_SUFFIX;
6247 else if (i.tm.opcode_modifier.size == SIZE32)
6248 i.suffix = LONG_MNEM_SUFFIX;
6249 else if (i.tm.opcode_modifier.size == SIZE64)
6250 i.suffix = QWORD_MNEM_SUFFIX;
6251 else if (i.reg_operands)
6252 {
6253 /* If there's no instruction mnemonic suffix we try to invent one
6254 based on register operands. */
6255 if (!i.suffix)
6256 {
6257 /* We take i.suffix from the last register operand specified,
6258 Destination register type is more significant than source
6259 register type. crc32 in SSE4.2 prefers source register
6260 type. */
6261 if (i.tm.base_opcode == 0xf20f38f0
6262 && i.types[0].bitfield.class == Reg)
6263 {
6264 if (i.types[0].bitfield.byte)
6265 i.suffix = BYTE_MNEM_SUFFIX;
6266 else if (i.types[0].bitfield.word)
6267 i.suffix = WORD_MNEM_SUFFIX;
6268 else if (i.types[0].bitfield.dword)
6269 i.suffix = LONG_MNEM_SUFFIX;
6270 else if (i.types[0].bitfield.qword)
6271 i.suffix = QWORD_MNEM_SUFFIX;
6272 }
6273
6274 if (!i.suffix)
6275 {
6276 int op;
6277
6278 if (i.tm.base_opcode == 0xf20f38f0)
6279 {
6280 /* We have to know the operand size for crc32. */
6281 as_bad (_("ambiguous memory operand size for `%s`"),
6282 i.tm.name);
6283 return 0;
6284 }
6285
6286 for (op = i.operands; --op >= 0;)
6287 if (!i.tm.operand_types[op].bitfield.inoutportreg
6288 && !i.tm.operand_types[op].bitfield.shiftcount)
6289 {
6290 if (i.types[op].bitfield.class != Reg)
6291 continue;
6292 if (i.types[op].bitfield.byte)
6293 i.suffix = BYTE_MNEM_SUFFIX;
6294 else if (i.types[op].bitfield.word)
6295 i.suffix = WORD_MNEM_SUFFIX;
6296 else if (i.types[op].bitfield.dword)
6297 i.suffix = LONG_MNEM_SUFFIX;
6298 else if (i.types[op].bitfield.qword)
6299 i.suffix = QWORD_MNEM_SUFFIX;
6300 else
6301 continue;
6302 break;
6303 }
6304 }
6305 }
6306 else if (i.suffix == BYTE_MNEM_SUFFIX)
6307 {
6308 if (intel_syntax
6309 && i.tm.opcode_modifier.ignoresize
6310 && i.tm.opcode_modifier.no_bsuf)
6311 i.suffix = 0;
6312 else if (!check_byte_reg ())
6313 return 0;
6314 }
6315 else if (i.suffix == LONG_MNEM_SUFFIX)
6316 {
6317 if (intel_syntax
6318 && i.tm.opcode_modifier.ignoresize
6319 && i.tm.opcode_modifier.no_lsuf
6320 && !i.tm.opcode_modifier.todword
6321 && !i.tm.opcode_modifier.toqword)
6322 i.suffix = 0;
6323 else if (!check_long_reg ())
6324 return 0;
6325 }
6326 else if (i.suffix == QWORD_MNEM_SUFFIX)
6327 {
6328 if (intel_syntax
6329 && i.tm.opcode_modifier.ignoresize
6330 && i.tm.opcode_modifier.no_qsuf
6331 && !i.tm.opcode_modifier.todword
6332 && !i.tm.opcode_modifier.toqword)
6333 i.suffix = 0;
6334 else if (!check_qword_reg ())
6335 return 0;
6336 }
6337 else if (i.suffix == WORD_MNEM_SUFFIX)
6338 {
6339 if (intel_syntax
6340 && i.tm.opcode_modifier.ignoresize
6341 && i.tm.opcode_modifier.no_wsuf)
6342 i.suffix = 0;
6343 else if (!check_word_reg ())
6344 return 0;
6345 }
6346 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6347 /* Do nothing if the instruction is going to ignore the prefix. */
6348 ;
6349 else
6350 abort ();
6351 }
6352 else if (i.tm.opcode_modifier.defaultsize
6353 && !i.suffix
6354 /* exclude fldenv/frstor/fsave/fstenv */
6355 && i.tm.opcode_modifier.no_ssuf)
6356 {
6357 if (stackop_size == LONG_MNEM_SUFFIX
6358 && i.tm.base_opcode == 0xcf)
6359 {
6360 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6361 .code16gcc directive to support 16-bit mode with
6362 32-bit address. For IRET without a suffix, generate
6363 16-bit IRET (opcode 0xcf) to return from an interrupt
6364 handler. */
6365 i.suffix = WORD_MNEM_SUFFIX;
6366 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6367 }
6368 else
6369 i.suffix = stackop_size;
6370 }
6371 else if (intel_syntax
6372 && !i.suffix
6373 && (i.tm.operand_types[0].bitfield.jumpabsolute
6374 || i.tm.opcode_modifier.jumpbyte
6375 || i.tm.opcode_modifier.jumpintersegment
6376 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6377 && i.tm.extension_opcode <= 3)))
6378 {
6379 switch (flag_code)
6380 {
6381 case CODE_64BIT:
6382 if (!i.tm.opcode_modifier.no_qsuf)
6383 {
6384 i.suffix = QWORD_MNEM_SUFFIX;
6385 break;
6386 }
6387 /* Fall through. */
6388 case CODE_32BIT:
6389 if (!i.tm.opcode_modifier.no_lsuf)
6390 i.suffix = LONG_MNEM_SUFFIX;
6391 break;
6392 case CODE_16BIT:
6393 if (!i.tm.opcode_modifier.no_wsuf)
6394 i.suffix = WORD_MNEM_SUFFIX;
6395 break;
6396 }
6397 }
6398
6399 if (!i.suffix)
6400 {
6401 if (!intel_syntax)
6402 {
6403 if (i.tm.opcode_modifier.w)
6404 {
6405 as_bad (_("no instruction mnemonic suffix given and "
6406 "no register operands; can't size instruction"));
6407 return 0;
6408 }
6409 }
6410 else
6411 {
6412 unsigned int suffixes;
6413
6414 suffixes = !i.tm.opcode_modifier.no_bsuf;
6415 if (!i.tm.opcode_modifier.no_wsuf)
6416 suffixes |= 1 << 1;
6417 if (!i.tm.opcode_modifier.no_lsuf)
6418 suffixes |= 1 << 2;
6419 if (!i.tm.opcode_modifier.no_ldsuf)
6420 suffixes |= 1 << 3;
6421 if (!i.tm.opcode_modifier.no_ssuf)
6422 suffixes |= 1 << 4;
6423 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6424 suffixes |= 1 << 5;
6425
6426 /* There are more than suffix matches. */
6427 if (i.tm.opcode_modifier.w
6428 || ((suffixes & (suffixes - 1))
6429 && !i.tm.opcode_modifier.defaultsize
6430 && !i.tm.opcode_modifier.ignoresize))
6431 {
6432 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6433 return 0;
6434 }
6435 }
6436 }
6437
6438 /* Change the opcode based on the operand size given by i.suffix. */
6439 switch (i.suffix)
6440 {
6441 /* Size floating point instruction. */
6442 case LONG_MNEM_SUFFIX:
6443 if (i.tm.opcode_modifier.floatmf)
6444 {
6445 i.tm.base_opcode ^= 4;
6446 break;
6447 }
6448 /* fall through */
6449 case WORD_MNEM_SUFFIX:
6450 case QWORD_MNEM_SUFFIX:
6451 /* It's not a byte, select word/dword operation. */
6452 if (i.tm.opcode_modifier.w)
6453 {
6454 if (i.tm.opcode_modifier.shortform)
6455 i.tm.base_opcode |= 8;
6456 else
6457 i.tm.base_opcode |= 1;
6458 }
6459 /* fall through */
6460 case SHORT_MNEM_SUFFIX:
6461 /* Now select between word & dword operations via the operand
6462 size prefix, except for instructions that will ignore this
6463 prefix anyway. */
6464 if (i.reg_operands > 0
6465 && i.types[0].bitfield.class == Reg
6466 && i.tm.opcode_modifier.addrprefixopreg
6467 && (i.tm.opcode_modifier.immext
6468 || i.operands == 1))
6469 {
6470 /* The address size override prefix changes the size of the
6471 first operand. */
6472 if ((flag_code == CODE_32BIT
6473 && i.op[0].regs->reg_type.bitfield.word)
6474 || (flag_code != CODE_32BIT
6475 && i.op[0].regs->reg_type.bitfield.dword))
6476 if (!add_prefix (ADDR_PREFIX_OPCODE))
6477 return 0;
6478 }
6479 else if (i.suffix != QWORD_MNEM_SUFFIX
6480 && !i.tm.opcode_modifier.ignoresize
6481 && !i.tm.opcode_modifier.floatmf
6482 && !is_any_vex_encoding (&i.tm)
6483 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6484 || (flag_code == CODE_64BIT
6485 && i.tm.opcode_modifier.jumpbyte)))
6486 {
6487 unsigned int prefix = DATA_PREFIX_OPCODE;
6488
6489 if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
6490 prefix = ADDR_PREFIX_OPCODE;
6491
6492 if (!add_prefix (prefix))
6493 return 0;
6494 }
6495
6496 /* Set mode64 for an operand. */
6497 if (i.suffix == QWORD_MNEM_SUFFIX
6498 && flag_code == CODE_64BIT
6499 && !i.tm.opcode_modifier.norex64
6500 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6501 need rex64. */
6502 && ! (i.operands == 2
6503 && i.tm.base_opcode == 0x90
6504 && i.tm.extension_opcode == None
6505 && i.types[0].bitfield.acc && i.types[0].bitfield.qword
6506 && i.types[1].bitfield.acc && i.types[1].bitfield.qword))
6507 i.rex |= REX_W;
6508
6509 break;
6510 }
6511
6512 if (i.reg_operands != 0
6513 && i.operands > 1
6514 && i.tm.opcode_modifier.addrprefixopreg
6515 && !i.tm.opcode_modifier.immext)
6516 {
6517 /* Check invalid register operand when the address size override
6518 prefix changes the size of register operands. */
6519 unsigned int op;
6520 enum { need_word, need_dword, need_qword } need;
6521
6522 if (flag_code == CODE_32BIT)
6523 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6524 else
6525 {
6526 if (i.prefix[ADDR_PREFIX])
6527 need = need_dword;
6528 else
6529 need = flag_code == CODE_64BIT ? need_qword : need_word;
6530 }
6531
6532 for (op = 0; op < i.operands; op++)
6533 if (i.types[op].bitfield.class == Reg
6534 && ((need == need_word
6535 && !i.op[op].regs->reg_type.bitfield.word)
6536 || (need == need_dword
6537 && !i.op[op].regs->reg_type.bitfield.dword)
6538 || (need == need_qword
6539 && !i.op[op].regs->reg_type.bitfield.qword)))
6540 {
6541 as_bad (_("invalid register operand size for `%s'"),
6542 i.tm.name);
6543 return 0;
6544 }
6545 }
6546
6547 return 1;
6548 }
6549
6550 static int
6551 check_byte_reg (void)
6552 {
6553 int op;
6554
6555 for (op = i.operands; --op >= 0;)
6556 {
6557 /* Skip non-register operands. */
6558 if (i.types[op].bitfield.class != Reg)
6559 continue;
6560
6561 /* If this is an eight bit register, it's OK. If it's the 16 or
6562 32 bit version of an eight bit register, we will just use the
6563 low portion, and that's OK too. */
6564 if (i.types[op].bitfield.byte)
6565 continue;
6566
6567 /* I/O port address operands are OK too. */
6568 if (i.tm.operand_types[op].bitfield.inoutportreg)
6569 continue;
6570
6571 /* crc32 doesn't generate this warning. */
6572 if (i.tm.base_opcode == 0xf20f38f0)
6573 continue;
6574
6575 if ((i.types[op].bitfield.word
6576 || i.types[op].bitfield.dword
6577 || i.types[op].bitfield.qword)
6578 && i.op[op].regs->reg_num < 4
6579 /* Prohibit these changes in 64bit mode, since the lowering
6580 would be more complicated. */
6581 && flag_code != CODE_64BIT)
6582 {
6583 #if REGISTER_WARNINGS
6584 if (!quiet_warnings)
6585 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6586 register_prefix,
6587 (i.op[op].regs + (i.types[op].bitfield.word
6588 ? REGNAM_AL - REGNAM_AX
6589 : REGNAM_AL - REGNAM_EAX))->reg_name,
6590 register_prefix,
6591 i.op[op].regs->reg_name,
6592 i.suffix);
6593 #endif
6594 continue;
6595 }
6596 /* Any other register is bad. */
6597 if (i.types[op].bitfield.class == Reg
6598 || i.types[op].bitfield.class == RegMMX
6599 || i.types[op].bitfield.class == RegSIMD
6600 || i.types[op].bitfield.class == SReg
6601 || i.types[op].bitfield.class == RegCR
6602 || i.types[op].bitfield.class == RegDR
6603 || i.types[op].bitfield.class == RegTR)
6604 {
6605 as_bad (_("`%s%s' not allowed with `%s%c'"),
6606 register_prefix,
6607 i.op[op].regs->reg_name,
6608 i.tm.name,
6609 i.suffix);
6610 return 0;
6611 }
6612 }
6613 return 1;
6614 }
6615
6616 static int
6617 check_long_reg (void)
6618 {
6619 int op;
6620
6621 for (op = i.operands; --op >= 0;)
6622 /* Skip non-register operands. */
6623 if (i.types[op].bitfield.class != Reg)
6624 continue;
6625 /* Reject eight bit registers, except where the template requires
6626 them. (eg. movzb) */
6627 else if (i.types[op].bitfield.byte
6628 && (i.tm.operand_types[op].bitfield.class == Reg
6629 || i.tm.operand_types[op].bitfield.acc)
6630 && (i.tm.operand_types[op].bitfield.word
6631 || i.tm.operand_types[op].bitfield.dword))
6632 {
6633 as_bad (_("`%s%s' not allowed with `%s%c'"),
6634 register_prefix,
6635 i.op[op].regs->reg_name,
6636 i.tm.name,
6637 i.suffix);
6638 return 0;
6639 }
6640 /* Warn if the e prefix on a general reg is missing. */
6641 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6642 && i.types[op].bitfield.word
6643 && (i.tm.operand_types[op].bitfield.class == Reg
6644 || i.tm.operand_types[op].bitfield.acc)
6645 && i.tm.operand_types[op].bitfield.dword)
6646 {
6647 /* Prohibit these changes in the 64bit mode, since the
6648 lowering is more complicated. */
6649 if (flag_code == CODE_64BIT)
6650 {
6651 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6652 register_prefix, i.op[op].regs->reg_name,
6653 i.suffix);
6654 return 0;
6655 }
6656 #if REGISTER_WARNINGS
6657 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6658 register_prefix,
6659 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6660 register_prefix, i.op[op].regs->reg_name, i.suffix);
6661 #endif
6662 }
6663 /* Warn if the r prefix on a general reg is present. */
6664 else if (i.types[op].bitfield.qword
6665 && (i.tm.operand_types[op].bitfield.class == Reg
6666 || i.tm.operand_types[op].bitfield.acc)
6667 && i.tm.operand_types[op].bitfield.dword)
6668 {
6669 if (intel_syntax
6670 && i.tm.opcode_modifier.toqword
6671 && i.types[0].bitfield.class != RegSIMD)
6672 {
6673 /* Convert to QWORD. We want REX byte. */
6674 i.suffix = QWORD_MNEM_SUFFIX;
6675 }
6676 else
6677 {
6678 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6679 register_prefix, i.op[op].regs->reg_name,
6680 i.suffix);
6681 return 0;
6682 }
6683 }
6684 return 1;
6685 }
6686
6687 static int
6688 check_qword_reg (void)
6689 {
6690 int op;
6691
6692 for (op = i.operands; --op >= 0; )
6693 /* Skip non-register operands. */
6694 if (i.types[op].bitfield.class != Reg)
6695 continue;
6696 /* Reject eight bit registers, except where the template requires
6697 them. (eg. movzb) */
6698 else if (i.types[op].bitfield.byte
6699 && (i.tm.operand_types[op].bitfield.class == Reg
6700 || i.tm.operand_types[op].bitfield.acc)
6701 && (i.tm.operand_types[op].bitfield.word
6702 || i.tm.operand_types[op].bitfield.dword))
6703 {
6704 as_bad (_("`%s%s' not allowed with `%s%c'"),
6705 register_prefix,
6706 i.op[op].regs->reg_name,
6707 i.tm.name,
6708 i.suffix);
6709 return 0;
6710 }
6711 /* Warn if the r prefix on a general reg is missing. */
6712 else if ((i.types[op].bitfield.word
6713 || i.types[op].bitfield.dword)
6714 && (i.tm.operand_types[op].bitfield.class == Reg
6715 || i.tm.operand_types[op].bitfield.acc)
6716 && i.tm.operand_types[op].bitfield.qword)
6717 {
6718 /* Prohibit these changes in the 64bit mode, since the
6719 lowering is more complicated. */
6720 if (intel_syntax
6721 && i.tm.opcode_modifier.todword
6722 && i.types[0].bitfield.class != RegSIMD)
6723 {
6724 /* Convert to DWORD. We don't want REX byte. */
6725 i.suffix = LONG_MNEM_SUFFIX;
6726 }
6727 else
6728 {
6729 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6730 register_prefix, i.op[op].regs->reg_name,
6731 i.suffix);
6732 return 0;
6733 }
6734 }
6735 return 1;
6736 }
6737
6738 static int
6739 check_word_reg (void)
6740 {
6741 int op;
6742 for (op = i.operands; --op >= 0;)
6743 /* Skip non-register operands. */
6744 if (i.types[op].bitfield.class != Reg)
6745 continue;
6746 /* Reject eight bit registers, except where the template requires
6747 them. (eg. movzb) */
6748 else if (i.types[op].bitfield.byte
6749 && (i.tm.operand_types[op].bitfield.class == Reg
6750 || i.tm.operand_types[op].bitfield.acc)
6751 && (i.tm.operand_types[op].bitfield.word
6752 || i.tm.operand_types[op].bitfield.dword))
6753 {
6754 as_bad (_("`%s%s' not allowed with `%s%c'"),
6755 register_prefix,
6756 i.op[op].regs->reg_name,
6757 i.tm.name,
6758 i.suffix);
6759 return 0;
6760 }
6761 /* Warn if the e or r prefix on a general reg is present. */
6762 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6763 && (i.types[op].bitfield.dword
6764 || i.types[op].bitfield.qword)
6765 && (i.tm.operand_types[op].bitfield.class == Reg
6766 || i.tm.operand_types[op].bitfield.acc)
6767 && i.tm.operand_types[op].bitfield.word)
6768 {
6769 /* Prohibit these changes in the 64bit mode, since the
6770 lowering is more complicated. */
6771 if (flag_code == CODE_64BIT)
6772 {
6773 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6774 register_prefix, i.op[op].regs->reg_name,
6775 i.suffix);
6776 return 0;
6777 }
6778 #if REGISTER_WARNINGS
6779 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6780 register_prefix,
6781 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6782 register_prefix, i.op[op].regs->reg_name, i.suffix);
6783 #endif
6784 }
6785 return 1;
6786 }
6787
6788 static int
6789 update_imm (unsigned int j)
6790 {
6791 i386_operand_type overlap = i.types[j];
6792 if ((overlap.bitfield.imm8
6793 || overlap.bitfield.imm8s
6794 || overlap.bitfield.imm16
6795 || overlap.bitfield.imm32
6796 || overlap.bitfield.imm32s
6797 || overlap.bitfield.imm64)
6798 && !operand_type_equal (&overlap, &imm8)
6799 && !operand_type_equal (&overlap, &imm8s)
6800 && !operand_type_equal (&overlap, &imm16)
6801 && !operand_type_equal (&overlap, &imm32)
6802 && !operand_type_equal (&overlap, &imm32s)
6803 && !operand_type_equal (&overlap, &imm64))
6804 {
6805 if (i.suffix)
6806 {
6807 i386_operand_type temp;
6808
6809 operand_type_set (&temp, 0);
6810 if (i.suffix == BYTE_MNEM_SUFFIX)
6811 {
6812 temp.bitfield.imm8 = overlap.bitfield.imm8;
6813 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6814 }
6815 else if (i.suffix == WORD_MNEM_SUFFIX)
6816 temp.bitfield.imm16 = overlap.bitfield.imm16;
6817 else if (i.suffix == QWORD_MNEM_SUFFIX)
6818 {
6819 temp.bitfield.imm64 = overlap.bitfield.imm64;
6820 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6821 }
6822 else
6823 temp.bitfield.imm32 = overlap.bitfield.imm32;
6824 overlap = temp;
6825 }
6826 else if (operand_type_equal (&overlap, &imm16_32_32s)
6827 || operand_type_equal (&overlap, &imm16_32)
6828 || operand_type_equal (&overlap, &imm16_32s))
6829 {
6830 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6831 overlap = imm16;
6832 else
6833 overlap = imm32s;
6834 }
6835 if (!operand_type_equal (&overlap, &imm8)
6836 && !operand_type_equal (&overlap, &imm8s)
6837 && !operand_type_equal (&overlap, &imm16)
6838 && !operand_type_equal (&overlap, &imm32)
6839 && !operand_type_equal (&overlap, &imm32s)
6840 && !operand_type_equal (&overlap, &imm64))
6841 {
6842 as_bad (_("no instruction mnemonic suffix given; "
6843 "can't determine immediate size"));
6844 return 0;
6845 }
6846 }
6847 i.types[j] = overlap;
6848
6849 return 1;
6850 }
6851
6852 static int
6853 finalize_imm (void)
6854 {
6855 unsigned int j, n;
6856
6857 /* Update the first 2 immediate operands. */
6858 n = i.operands > 2 ? 2 : i.operands;
6859 if (n)
6860 {
6861 for (j = 0; j < n; j++)
6862 if (update_imm (j) == 0)
6863 return 0;
6864
6865 /* The 3rd operand can't be immediate operand. */
6866 gas_assert (operand_type_check (i.types[2], imm) == 0);
6867 }
6868
6869 return 1;
6870 }
6871
6872 static int
6873 process_operands (void)
6874 {
6875 /* Default segment register this instruction will use for memory
6876 accesses. 0 means unknown. This is only for optimizing out
6877 unnecessary segment overrides. */
6878 const seg_entry *default_seg = 0;
6879
6880 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6881 {
6882 unsigned int dupl = i.operands;
6883 unsigned int dest = dupl - 1;
6884 unsigned int j;
6885
6886 /* The destination must be an xmm register. */
6887 gas_assert (i.reg_operands
6888 && MAX_OPERANDS > dupl
6889 && operand_type_equal (&i.types[dest], &regxmm));
6890
6891 if (i.tm.operand_types[0].bitfield.acc
6892 && i.tm.operand_types[0].bitfield.xmmword)
6893 {
6894 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6895 {
6896 /* Keep xmm0 for instructions with VEX prefix and 3
6897 sources. */
6898 i.tm.operand_types[0].bitfield.acc = 0;
6899 i.tm.operand_types[0].bitfield.class = RegSIMD;
6900 goto duplicate;
6901 }
6902 else
6903 {
6904 /* We remove the first xmm0 and keep the number of
6905 operands unchanged, which in fact duplicates the
6906 destination. */
6907 for (j = 1; j < i.operands; j++)
6908 {
6909 i.op[j - 1] = i.op[j];
6910 i.types[j - 1] = i.types[j];
6911 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6912 i.flags[j - 1] = i.flags[j];
6913 }
6914 }
6915 }
6916 else if (i.tm.opcode_modifier.implicit1stxmm0)
6917 {
6918 gas_assert ((MAX_OPERANDS - 1) > dupl
6919 && (i.tm.opcode_modifier.vexsources
6920 == VEX3SOURCES));
6921
6922 /* Add the implicit xmm0 for instructions with VEX prefix
6923 and 3 sources. */
6924 for (j = i.operands; j > 0; j--)
6925 {
6926 i.op[j] = i.op[j - 1];
6927 i.types[j] = i.types[j - 1];
6928 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6929 i.flags[j] = i.flags[j - 1];
6930 }
6931 i.op[0].regs
6932 = (const reg_entry *) hash_find (reg_hash, "xmm0");
6933 i.types[0] = regxmm;
6934 i.tm.operand_types[0] = regxmm;
6935
6936 i.operands += 2;
6937 i.reg_operands += 2;
6938 i.tm.operands += 2;
6939
6940 dupl++;
6941 dest++;
6942 i.op[dupl] = i.op[dest];
6943 i.types[dupl] = i.types[dest];
6944 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6945 i.flags[dupl] = i.flags[dest];
6946 }
6947 else
6948 {
6949 duplicate:
6950 i.operands++;
6951 i.reg_operands++;
6952 i.tm.operands++;
6953
6954 i.op[dupl] = i.op[dest];
6955 i.types[dupl] = i.types[dest];
6956 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6957 i.flags[dupl] = i.flags[dest];
6958 }
6959
6960 if (i.tm.opcode_modifier.immext)
6961 process_immext ();
6962 }
6963 else if (i.tm.operand_types[0].bitfield.acc
6964 && i.tm.operand_types[0].bitfield.xmmword)
6965 {
6966 unsigned int j;
6967
6968 for (j = 1; j < i.operands; j++)
6969 {
6970 i.op[j - 1] = i.op[j];
6971 i.types[j - 1] = i.types[j];
6972
6973 /* We need to adjust fields in i.tm since they are used by
6974 build_modrm_byte. */
6975 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
6976
6977 i.flags[j - 1] = i.flags[j];
6978 }
6979
6980 i.operands--;
6981 i.reg_operands--;
6982 i.tm.operands--;
6983 }
6984 else if (i.tm.opcode_modifier.implicitquadgroup)
6985 {
6986 unsigned int regnum, first_reg_in_group, last_reg_in_group;
6987
6988 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
6989 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
6990 regnum = register_number (i.op[1].regs);
6991 first_reg_in_group = regnum & ~3;
6992 last_reg_in_group = first_reg_in_group + 3;
6993 if (regnum != first_reg_in_group)
6994 as_warn (_("source register `%s%s' implicitly denotes"
6995 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
6996 register_prefix, i.op[1].regs->reg_name,
6997 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
6998 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
6999 i.tm.name);
7000 }
7001 else if (i.tm.opcode_modifier.regkludge)
7002 {
7003 /* The imul $imm, %reg instruction is converted into
7004 imul $imm, %reg, %reg, and the clr %reg instruction
7005 is converted into xor %reg, %reg. */
7006
7007 unsigned int first_reg_op;
7008
7009 if (operand_type_check (i.types[0], reg))
7010 first_reg_op = 0;
7011 else
7012 first_reg_op = 1;
7013 /* Pretend we saw the extra register operand. */
7014 gas_assert (i.reg_operands == 1
7015 && i.op[first_reg_op + 1].regs == 0);
7016 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7017 i.types[first_reg_op + 1] = i.types[first_reg_op];
7018 i.operands++;
7019 i.reg_operands++;
7020 }
7021
7022 if (i.tm.opcode_modifier.modrm)
7023 {
7024 /* The opcode is completed (modulo i.tm.extension_opcode which
7025 must be put into the modrm byte). Now, we make the modrm and
7026 index base bytes based on all the info we've collected. */
7027
7028 default_seg = build_modrm_byte ();
7029 }
7030 else if (i.types[0].bitfield.class == SReg)
7031 {
7032 if (flag_code != CODE_64BIT
7033 ? i.tm.base_opcode == POP_SEG_SHORT
7034 && i.op[0].regs->reg_num == 1
7035 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7036 && i.op[0].regs->reg_num < 4)
7037 {
7038 as_bad (_("you can't `%s %s%s'"),
7039 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7040 return 0;
7041 }
7042 if ( i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1 )
7043 {
7044 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7045 i.tm.opcode_length = 2;
7046 }
7047 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7048 }
7049 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7050 {
7051 default_seg = &ds;
7052 }
7053 else if (i.tm.opcode_modifier.isstring)
7054 {
7055 /* For the string instructions that allow a segment override
7056 on one of their operands, the default segment is ds. */
7057 default_seg = &ds;
7058 }
7059 else if (i.tm.opcode_modifier.shortform)
7060 {
7061 /* The register or float register operand is in operand
7062 0 or 1. */
7063 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7064
7065 /* Register goes in low 3 bits of opcode. */
7066 i.tm.base_opcode |= i.op[op].regs->reg_num;
7067 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7068 i.rex |= REX_B;
7069 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7070 {
7071 /* Warn about some common errors, but press on regardless.
7072 The first case can be generated by gcc (<= 2.8.1). */
7073 if (i.operands == 2)
7074 {
7075 /* Reversed arguments on faddp, fsubp, etc. */
7076 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7077 register_prefix, i.op[!intel_syntax].regs->reg_name,
7078 register_prefix, i.op[intel_syntax].regs->reg_name);
7079 }
7080 else
7081 {
7082 /* Extraneous `l' suffix on fp insn. */
7083 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7084 register_prefix, i.op[0].regs->reg_name);
7085 }
7086 }
7087 }
7088
7089 if (i.tm.base_opcode == 0x8d /* lea */
7090 && i.seg[0]
7091 && !quiet_warnings)
7092 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7093
7094 /* If a segment was explicitly specified, and the specified segment
7095 is not the default, use an opcode prefix to select it. If we
7096 never figured out what the default segment is, then default_seg
7097 will be zero at this point, and the specified segment prefix will
7098 always be used. */
7099 if ((i.seg[0]) && (i.seg[0] != default_seg))
7100 {
7101 if (!add_prefix (i.seg[0]->seg_prefix))
7102 return 0;
7103 }
7104 return 1;
7105 }
7106
7107 static const seg_entry *
7108 build_modrm_byte (void)
7109 {
7110 const seg_entry *default_seg = 0;
7111 unsigned int source, dest;
7112 int vex_3_sources;
7113
7114 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7115 if (vex_3_sources)
7116 {
7117 unsigned int nds, reg_slot;
7118 expressionS *exp;
7119
7120 dest = i.operands - 1;
7121 nds = dest - 1;
7122
7123 /* There are 2 kinds of instructions:
7124 1. 5 operands: 4 register operands or 3 register operands
7125 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7126 VexW0 or VexW1. The destination must be either XMM, YMM or
7127 ZMM register.
7128 2. 4 operands: 4 register operands or 3 register operands
7129 plus 1 memory operand, with VexXDS. */
7130 gas_assert ((i.reg_operands == 4
7131 || (i.reg_operands == 3 && i.mem_operands == 1))
7132 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7133 && i.tm.opcode_modifier.vexw
7134 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7135
7136 /* If VexW1 is set, the first non-immediate operand is the source and
7137 the second non-immediate one is encoded in the immediate operand. */
7138 if (i.tm.opcode_modifier.vexw == VEXW1)
7139 {
7140 source = i.imm_operands;
7141 reg_slot = i.imm_operands + 1;
7142 }
7143 else
7144 {
7145 source = i.imm_operands + 1;
7146 reg_slot = i.imm_operands;
7147 }
7148
7149 if (i.imm_operands == 0)
7150 {
7151 /* When there is no immediate operand, generate an 8bit
7152 immediate operand to encode the first operand. */
7153 exp = &im_expressions[i.imm_operands++];
7154 i.op[i.operands].imms = exp;
7155 i.types[i.operands] = imm8;
7156 i.operands++;
7157
7158 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7159 exp->X_op = O_constant;
7160 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7161 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7162 }
7163 else
7164 {
7165 gas_assert (i.imm_operands == 1);
7166 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7167 gas_assert (!i.tm.opcode_modifier.immext);
7168
7169 /* Turn on Imm8 again so that output_imm will generate it. */
7170 i.types[0].bitfield.imm8 = 1;
7171
7172 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7173 i.op[0].imms->X_add_number
7174 |= register_number (i.op[reg_slot].regs) << 4;
7175 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7176 }
7177
7178 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7179 i.vex.register_specifier = i.op[nds].regs;
7180 }
7181 else
7182 source = dest = 0;
7183
7184 /* i.reg_operands MUST be the number of real register operands;
7185 implicit registers do not count. If there are 3 register
7186 operands, it must be a instruction with VexNDS. For a
7187 instruction with VexNDD, the destination register is encoded
7188 in VEX prefix. If there are 4 register operands, it must be
7189 a instruction with VEX prefix and 3 sources. */
7190 if (i.mem_operands == 0
7191 && ((i.reg_operands == 2
7192 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7193 || (i.reg_operands == 3
7194 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7195 || (i.reg_operands == 4 && vex_3_sources)))
7196 {
7197 switch (i.operands)
7198 {
7199 case 2:
7200 source = 0;
7201 break;
7202 case 3:
7203 /* When there are 3 operands, one of them may be immediate,
7204 which may be the first or the last operand. Otherwise,
7205 the first operand must be shift count register (cl) or it
7206 is an instruction with VexNDS. */
7207 gas_assert (i.imm_operands == 1
7208 || (i.imm_operands == 0
7209 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7210 || i.types[0].bitfield.shiftcount)));
7211 if (operand_type_check (i.types[0], imm)
7212 || i.types[0].bitfield.shiftcount)
7213 source = 1;
7214 else
7215 source = 0;
7216 break;
7217 case 4:
7218 /* When there are 4 operands, the first two must be 8bit
7219 immediate operands. The source operand will be the 3rd
7220 one.
7221
7222 For instructions with VexNDS, if the first operand
7223 an imm8, the source operand is the 2nd one. If the last
7224 operand is imm8, the source operand is the first one. */
7225 gas_assert ((i.imm_operands == 2
7226 && i.types[0].bitfield.imm8
7227 && i.types[1].bitfield.imm8)
7228 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7229 && i.imm_operands == 1
7230 && (i.types[0].bitfield.imm8
7231 || i.types[i.operands - 1].bitfield.imm8
7232 || i.rounding)));
7233 if (i.imm_operands == 2)
7234 source = 2;
7235 else
7236 {
7237 if (i.types[0].bitfield.imm8)
7238 source = 1;
7239 else
7240 source = 0;
7241 }
7242 break;
7243 case 5:
7244 if (is_evex_encoding (&i.tm))
7245 {
7246 /* For EVEX instructions, when there are 5 operands, the
7247 first one must be immediate operand. If the second one
7248 is immediate operand, the source operand is the 3th
7249 one. If the last one is immediate operand, the source
7250 operand is the 2nd one. */
7251 gas_assert (i.imm_operands == 2
7252 && i.tm.opcode_modifier.sae
7253 && operand_type_check (i.types[0], imm));
7254 if (operand_type_check (i.types[1], imm))
7255 source = 2;
7256 else if (operand_type_check (i.types[4], imm))
7257 source = 1;
7258 else
7259 abort ();
7260 }
7261 break;
7262 default:
7263 abort ();
7264 }
7265
7266 if (!vex_3_sources)
7267 {
7268 dest = source + 1;
7269
7270 /* RC/SAE operand could be between DEST and SRC. That happens
7271 when one operand is GPR and the other one is XMM/YMM/ZMM
7272 register. */
7273 if (i.rounding && i.rounding->operand == (int) dest)
7274 dest++;
7275
7276 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7277 {
7278 /* For instructions with VexNDS, the register-only source
7279 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7280 register. It is encoded in VEX prefix. */
7281
7282 i386_operand_type op;
7283 unsigned int vvvv;
7284
7285 /* Check register-only source operand when two source
7286 operands are swapped. */
7287 if (!i.tm.operand_types[source].bitfield.baseindex
7288 && i.tm.operand_types[dest].bitfield.baseindex)
7289 {
7290 vvvv = source;
7291 source = dest;
7292 }
7293 else
7294 vvvv = dest;
7295
7296 op = i.tm.operand_types[vvvv];
7297 if ((dest + 1) >= i.operands
7298 || ((op.bitfield.class != Reg
7299 || (!op.bitfield.dword && !op.bitfield.qword))
7300 && op.bitfield.class != RegSIMD
7301 && !operand_type_equal (&op, &regmask)))
7302 abort ();
7303 i.vex.register_specifier = i.op[vvvv].regs;
7304 dest++;
7305 }
7306 }
7307
7308 i.rm.mode = 3;
7309 /* One of the register operands will be encoded in the i.rm.reg
7310 field, the other in the combined i.rm.mode and i.rm.regmem
7311 fields. If no form of this instruction supports a memory
7312 destination operand, then we assume the source operand may
7313 sometimes be a memory operand and so we need to store the
7314 destination in the i.rm.reg field. */
7315 if (!i.tm.opcode_modifier.regmem
7316 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7317 {
7318 i.rm.reg = i.op[dest].regs->reg_num;
7319 i.rm.regmem = i.op[source].regs->reg_num;
7320 if (i.op[dest].regs->reg_type.bitfield.class == RegMMX
7321 || i.op[source].regs->reg_type.bitfield.class == RegMMX)
7322 i.has_regmmx = TRUE;
7323 else if (i.op[dest].regs->reg_type.bitfield.class == RegSIMD
7324 || i.op[source].regs->reg_type.bitfield.class == RegSIMD)
7325 {
7326 if (i.types[dest].bitfield.zmmword
7327 || i.types[source].bitfield.zmmword)
7328 i.has_regzmm = TRUE;
7329 else if (i.types[dest].bitfield.ymmword
7330 || i.types[source].bitfield.ymmword)
7331 i.has_regymm = TRUE;
7332 else
7333 i.has_regxmm = TRUE;
7334 }
7335 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7336 i.rex |= REX_R;
7337 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7338 i.vrex |= REX_R;
7339 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7340 i.rex |= REX_B;
7341 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7342 i.vrex |= REX_B;
7343 }
7344 else
7345 {
7346 i.rm.reg = i.op[source].regs->reg_num;
7347 i.rm.regmem = i.op[dest].regs->reg_num;
7348 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7349 i.rex |= REX_B;
7350 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7351 i.vrex |= REX_B;
7352 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7353 i.rex |= REX_R;
7354 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7355 i.vrex |= REX_R;
7356 }
7357 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7358 {
7359 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
7360 abort ();
7361 i.rex &= ~REX_R;
7362 add_prefix (LOCK_PREFIX_OPCODE);
7363 }
7364 }
7365 else
7366 { /* If it's not 2 reg operands... */
7367 unsigned int mem;
7368
7369 if (i.mem_operands)
7370 {
7371 unsigned int fake_zero_displacement = 0;
7372 unsigned int op;
7373
7374 for (op = 0; op < i.operands; op++)
7375 if (i.flags[op] & Operand_Mem)
7376 break;
7377 gas_assert (op < i.operands);
7378
7379 if (i.tm.opcode_modifier.vecsib)
7380 {
7381 if (i.index_reg->reg_num == RegIZ)
7382 abort ();
7383
7384 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7385 if (!i.base_reg)
7386 {
7387 i.sib.base = NO_BASE_REGISTER;
7388 i.sib.scale = i.log2_scale_factor;
7389 i.types[op].bitfield.disp8 = 0;
7390 i.types[op].bitfield.disp16 = 0;
7391 i.types[op].bitfield.disp64 = 0;
7392 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7393 {
7394 /* Must be 32 bit */
7395 i.types[op].bitfield.disp32 = 1;
7396 i.types[op].bitfield.disp32s = 0;
7397 }
7398 else
7399 {
7400 i.types[op].bitfield.disp32 = 0;
7401 i.types[op].bitfield.disp32s = 1;
7402 }
7403 }
7404 i.sib.index = i.index_reg->reg_num;
7405 if ((i.index_reg->reg_flags & RegRex) != 0)
7406 i.rex |= REX_X;
7407 if ((i.index_reg->reg_flags & RegVRex) != 0)
7408 i.vrex |= REX_X;
7409 }
7410
7411 default_seg = &ds;
7412
7413 if (i.base_reg == 0)
7414 {
7415 i.rm.mode = 0;
7416 if (!i.disp_operands)
7417 fake_zero_displacement = 1;
7418 if (i.index_reg == 0)
7419 {
7420 i386_operand_type newdisp;
7421
7422 gas_assert (!i.tm.opcode_modifier.vecsib);
7423 /* Operand is just <disp> */
7424 if (flag_code == CODE_64BIT)
7425 {
7426 /* 64bit mode overwrites the 32bit absolute
7427 addressing by RIP relative addressing and
7428 absolute addressing is encoded by one of the
7429 redundant SIB forms. */
7430 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7431 i.sib.base = NO_BASE_REGISTER;
7432 i.sib.index = NO_INDEX_REGISTER;
7433 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7434 }
7435 else if ((flag_code == CODE_16BIT)
7436 ^ (i.prefix[ADDR_PREFIX] != 0))
7437 {
7438 i.rm.regmem = NO_BASE_REGISTER_16;
7439 newdisp = disp16;
7440 }
7441 else
7442 {
7443 i.rm.regmem = NO_BASE_REGISTER;
7444 newdisp = disp32;
7445 }
7446 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7447 i.types[op] = operand_type_or (i.types[op], newdisp);
7448 }
7449 else if (!i.tm.opcode_modifier.vecsib)
7450 {
7451 /* !i.base_reg && i.index_reg */
7452 if (i.index_reg->reg_num == RegIZ)
7453 i.sib.index = NO_INDEX_REGISTER;
7454 else
7455 i.sib.index = i.index_reg->reg_num;
7456 i.sib.base = NO_BASE_REGISTER;
7457 i.sib.scale = i.log2_scale_factor;
7458 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7459 i.types[op].bitfield.disp8 = 0;
7460 i.types[op].bitfield.disp16 = 0;
7461 i.types[op].bitfield.disp64 = 0;
7462 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7463 {
7464 /* Must be 32 bit */
7465 i.types[op].bitfield.disp32 = 1;
7466 i.types[op].bitfield.disp32s = 0;
7467 }
7468 else
7469 {
7470 i.types[op].bitfield.disp32 = 0;
7471 i.types[op].bitfield.disp32s = 1;
7472 }
7473 if ((i.index_reg->reg_flags & RegRex) != 0)
7474 i.rex |= REX_X;
7475 }
7476 }
7477 /* RIP addressing for 64bit mode. */
7478 else if (i.base_reg->reg_num == RegIP)
7479 {
7480 gas_assert (!i.tm.opcode_modifier.vecsib);
7481 i.rm.regmem = NO_BASE_REGISTER;
7482 i.types[op].bitfield.disp8 = 0;
7483 i.types[op].bitfield.disp16 = 0;
7484 i.types[op].bitfield.disp32 = 0;
7485 i.types[op].bitfield.disp32s = 1;
7486 i.types[op].bitfield.disp64 = 0;
7487 i.flags[op] |= Operand_PCrel;
7488 if (! i.disp_operands)
7489 fake_zero_displacement = 1;
7490 }
7491 else if (i.base_reg->reg_type.bitfield.word)
7492 {
7493 gas_assert (!i.tm.opcode_modifier.vecsib);
7494 switch (i.base_reg->reg_num)
7495 {
7496 case 3: /* (%bx) */
7497 if (i.index_reg == 0)
7498 i.rm.regmem = 7;
7499 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7500 i.rm.regmem = i.index_reg->reg_num - 6;
7501 break;
7502 case 5: /* (%bp) */
7503 default_seg = &ss;
7504 if (i.index_reg == 0)
7505 {
7506 i.rm.regmem = 6;
7507 if (operand_type_check (i.types[op], disp) == 0)
7508 {
7509 /* fake (%bp) into 0(%bp) */
7510 i.types[op].bitfield.disp8 = 1;
7511 fake_zero_displacement = 1;
7512 }
7513 }
7514 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7515 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7516 break;
7517 default: /* (%si) -> 4 or (%di) -> 5 */
7518 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7519 }
7520 i.rm.mode = mode_from_disp_size (i.types[op]);
7521 }
7522 else /* i.base_reg and 32/64 bit mode */
7523 {
7524 if (flag_code == CODE_64BIT
7525 && operand_type_check (i.types[op], disp))
7526 {
7527 i.types[op].bitfield.disp16 = 0;
7528 i.types[op].bitfield.disp64 = 0;
7529 if (i.prefix[ADDR_PREFIX] == 0)
7530 {
7531 i.types[op].bitfield.disp32 = 0;
7532 i.types[op].bitfield.disp32s = 1;
7533 }
7534 else
7535 {
7536 i.types[op].bitfield.disp32 = 1;
7537 i.types[op].bitfield.disp32s = 0;
7538 }
7539 }
7540
7541 if (!i.tm.opcode_modifier.vecsib)
7542 i.rm.regmem = i.base_reg->reg_num;
7543 if ((i.base_reg->reg_flags & RegRex) != 0)
7544 i.rex |= REX_B;
7545 i.sib.base = i.base_reg->reg_num;
7546 /* x86-64 ignores REX prefix bit here to avoid decoder
7547 complications. */
7548 if (!(i.base_reg->reg_flags & RegRex)
7549 && (i.base_reg->reg_num == EBP_REG_NUM
7550 || i.base_reg->reg_num == ESP_REG_NUM))
7551 default_seg = &ss;
7552 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7553 {
7554 fake_zero_displacement = 1;
7555 i.types[op].bitfield.disp8 = 1;
7556 }
7557 i.sib.scale = i.log2_scale_factor;
7558 if (i.index_reg == 0)
7559 {
7560 gas_assert (!i.tm.opcode_modifier.vecsib);
7561 /* <disp>(%esp) becomes two byte modrm with no index
7562 register. We've already stored the code for esp
7563 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7564 Any base register besides %esp will not use the
7565 extra modrm byte. */
7566 i.sib.index = NO_INDEX_REGISTER;
7567 }
7568 else if (!i.tm.opcode_modifier.vecsib)
7569 {
7570 if (i.index_reg->reg_num == RegIZ)
7571 i.sib.index = NO_INDEX_REGISTER;
7572 else
7573 i.sib.index = i.index_reg->reg_num;
7574 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7575 if ((i.index_reg->reg_flags & RegRex) != 0)
7576 i.rex |= REX_X;
7577 }
7578
7579 if (i.disp_operands
7580 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7581 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7582 i.rm.mode = 0;
7583 else
7584 {
7585 if (!fake_zero_displacement
7586 && !i.disp_operands
7587 && i.disp_encoding)
7588 {
7589 fake_zero_displacement = 1;
7590 if (i.disp_encoding == disp_encoding_8bit)
7591 i.types[op].bitfield.disp8 = 1;
7592 else
7593 i.types[op].bitfield.disp32 = 1;
7594 }
7595 i.rm.mode = mode_from_disp_size (i.types[op]);
7596 }
7597 }
7598
7599 if (fake_zero_displacement)
7600 {
7601 /* Fakes a zero displacement assuming that i.types[op]
7602 holds the correct displacement size. */
7603 expressionS *exp;
7604
7605 gas_assert (i.op[op].disps == 0);
7606 exp = &disp_expressions[i.disp_operands++];
7607 i.op[op].disps = exp;
7608 exp->X_op = O_constant;
7609 exp->X_add_number = 0;
7610 exp->X_add_symbol = (symbolS *) 0;
7611 exp->X_op_symbol = (symbolS *) 0;
7612 }
7613
7614 mem = op;
7615 }
7616 else
7617 mem = ~0;
7618
7619 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7620 {
7621 if (operand_type_check (i.types[0], imm))
7622 i.vex.register_specifier = NULL;
7623 else
7624 {
7625 /* VEX.vvvv encodes one of the sources when the first
7626 operand is not an immediate. */
7627 if (i.tm.opcode_modifier.vexw == VEXW0)
7628 i.vex.register_specifier = i.op[0].regs;
7629 else
7630 i.vex.register_specifier = i.op[1].regs;
7631 }
7632
7633 /* Destination is a XMM register encoded in the ModRM.reg
7634 and VEX.R bit. */
7635 i.rm.reg = i.op[2].regs->reg_num;
7636 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7637 i.rex |= REX_R;
7638
7639 /* ModRM.rm and VEX.B encodes the other source. */
7640 if (!i.mem_operands)
7641 {
7642 i.rm.mode = 3;
7643
7644 if (i.tm.opcode_modifier.vexw == VEXW0)
7645 i.rm.regmem = i.op[1].regs->reg_num;
7646 else
7647 i.rm.regmem = i.op[0].regs->reg_num;
7648
7649 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7650 i.rex |= REX_B;
7651 }
7652 }
7653 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7654 {
7655 i.vex.register_specifier = i.op[2].regs;
7656 if (!i.mem_operands)
7657 {
7658 i.rm.mode = 3;
7659 i.rm.regmem = i.op[1].regs->reg_num;
7660 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7661 i.rex |= REX_B;
7662 }
7663 }
7664 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7665 (if any) based on i.tm.extension_opcode. Again, we must be
7666 careful to make sure that segment/control/debug/test/MMX
7667 registers are coded into the i.rm.reg field. */
7668 else if (i.reg_operands)
7669 {
7670 unsigned int op;
7671 unsigned int vex_reg = ~0;
7672
7673 for (op = 0; op < i.operands; op++)
7674 {
7675 if (i.types[op].bitfield.class == Reg
7676 || i.types[op].bitfield.class == RegBND
7677 || i.types[op].bitfield.class == RegMask
7678 || i.types[op].bitfield.class == SReg
7679 || i.types[op].bitfield.class == RegCR
7680 || i.types[op].bitfield.class == RegDR
7681 || i.types[op].bitfield.class == RegTR)
7682 break;
7683 if (i.types[op].bitfield.class == RegSIMD)
7684 {
7685 if (i.types[op].bitfield.zmmword)
7686 i.has_regzmm = TRUE;
7687 else if (i.types[op].bitfield.ymmword)
7688 i.has_regymm = TRUE;
7689 else
7690 i.has_regxmm = TRUE;
7691 break;
7692 }
7693 if (i.types[op].bitfield.class == RegMMX)
7694 {
7695 i.has_regmmx = TRUE;
7696 break;
7697 }
7698 }
7699
7700 if (vex_3_sources)
7701 op = dest;
7702 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7703 {
7704 /* For instructions with VexNDS, the register-only
7705 source operand is encoded in VEX prefix. */
7706 gas_assert (mem != (unsigned int) ~0);
7707
7708 if (op > mem)
7709 {
7710 vex_reg = op++;
7711 gas_assert (op < i.operands);
7712 }
7713 else
7714 {
7715 /* Check register-only source operand when two source
7716 operands are swapped. */
7717 if (!i.tm.operand_types[op].bitfield.baseindex
7718 && i.tm.operand_types[op + 1].bitfield.baseindex)
7719 {
7720 vex_reg = op;
7721 op += 2;
7722 gas_assert (mem == (vex_reg + 1)
7723 && op < i.operands);
7724 }
7725 else
7726 {
7727 vex_reg = op + 1;
7728 gas_assert (vex_reg < i.operands);
7729 }
7730 }
7731 }
7732 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7733 {
7734 /* For instructions with VexNDD, the register destination
7735 is encoded in VEX prefix. */
7736 if (i.mem_operands == 0)
7737 {
7738 /* There is no memory operand. */
7739 gas_assert ((op + 2) == i.operands);
7740 vex_reg = op + 1;
7741 }
7742 else
7743 {
7744 /* There are only 2 non-immediate operands. */
7745 gas_assert (op < i.imm_operands + 2
7746 && i.operands == i.imm_operands + 2);
7747 vex_reg = i.imm_operands + 1;
7748 }
7749 }
7750 else
7751 gas_assert (op < i.operands);
7752
7753 if (vex_reg != (unsigned int) ~0)
7754 {
7755 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7756
7757 if ((type->bitfield.class != Reg
7758 || (!type->bitfield.dword && !type->bitfield.qword))
7759 && type->bitfield.class != RegSIMD
7760 && !operand_type_equal (type, &regmask))
7761 abort ();
7762
7763 i.vex.register_specifier = i.op[vex_reg].regs;
7764 }
7765
7766 /* Don't set OP operand twice. */
7767 if (vex_reg != op)
7768 {
7769 /* If there is an extension opcode to put here, the
7770 register number must be put into the regmem field. */
7771 if (i.tm.extension_opcode != None)
7772 {
7773 i.rm.regmem = i.op[op].regs->reg_num;
7774 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7775 i.rex |= REX_B;
7776 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7777 i.vrex |= REX_B;
7778 }
7779 else
7780 {
7781 i.rm.reg = i.op[op].regs->reg_num;
7782 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7783 i.rex |= REX_R;
7784 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7785 i.vrex |= REX_R;
7786 }
7787 }
7788
7789 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7790 must set it to 3 to indicate this is a register operand
7791 in the regmem field. */
7792 if (!i.mem_operands)
7793 i.rm.mode = 3;
7794 }
7795
7796 /* Fill in i.rm.reg field with extension opcode (if any). */
7797 if (i.tm.extension_opcode != None)
7798 i.rm.reg = i.tm.extension_opcode;
7799 }
7800 return default_seg;
7801 }
7802
7803 static void
7804 output_branch (void)
7805 {
7806 char *p;
7807 int size;
7808 int code16;
7809 int prefix;
7810 relax_substateT subtype;
7811 symbolS *sym;
7812 offsetT off;
7813
7814 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7815 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7816
7817 prefix = 0;
7818 if (i.prefix[DATA_PREFIX] != 0)
7819 {
7820 prefix = 1;
7821 i.prefixes -= 1;
7822 code16 ^= CODE16;
7823 }
7824 /* Pentium4 branch hints. */
7825 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7826 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7827 {
7828 prefix++;
7829 i.prefixes--;
7830 }
7831 if (i.prefix[REX_PREFIX] != 0)
7832 {
7833 prefix++;
7834 i.prefixes--;
7835 }
7836
7837 /* BND prefixed jump. */
7838 if (i.prefix[BND_PREFIX] != 0)
7839 {
7840 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7841 i.prefixes -= 1;
7842 }
7843
7844 if (i.prefixes != 0 && !intel_syntax)
7845 as_warn (_("skipping prefixes on this instruction"));
7846
7847 /* It's always a symbol; End frag & setup for relax.
7848 Make sure there is enough room in this frag for the largest
7849 instruction we may generate in md_convert_frag. This is 2
7850 bytes for the opcode and room for the prefix and largest
7851 displacement. */
7852 frag_grow (prefix + 2 + 4);
7853 /* Prefix and 1 opcode byte go in fr_fix. */
7854 p = frag_more (prefix + 1);
7855 if (i.prefix[DATA_PREFIX] != 0)
7856 *p++ = DATA_PREFIX_OPCODE;
7857 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7858 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7859 *p++ = i.prefix[SEG_PREFIX];
7860 if (i.prefix[REX_PREFIX] != 0)
7861 *p++ = i.prefix[REX_PREFIX];
7862 *p = i.tm.base_opcode;
7863
7864 if ((unsigned char) *p == JUMP_PC_RELATIVE)
7865 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7866 else if (cpu_arch_flags.bitfield.cpui386)
7867 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7868 else
7869 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7870 subtype |= code16;
7871
7872 sym = i.op[0].disps->X_add_symbol;
7873 off = i.op[0].disps->X_add_number;
7874
7875 if (i.op[0].disps->X_op != O_constant
7876 && i.op[0].disps->X_op != O_symbol)
7877 {
7878 /* Handle complex expressions. */
7879 sym = make_expr_symbol (i.op[0].disps);
7880 off = 0;
7881 }
7882
7883 /* 1 possible extra opcode + 4 byte displacement go in var part.
7884 Pass reloc in fr_var. */
7885 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7886 }
7887
7888 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7889 /* Return TRUE iff PLT32 relocation should be used for branching to
7890 symbol S. */
7891
7892 static bfd_boolean
7893 need_plt32_p (symbolS *s)
7894 {
7895 /* PLT32 relocation is ELF only. */
7896 if (!IS_ELF)
7897 return FALSE;
7898
7899 #ifdef TE_SOLARIS
7900 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
7901 krtld support it. */
7902 return FALSE;
7903 #endif
7904
7905 /* Since there is no need to prepare for PLT branch on x86-64, we
7906 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7907 be used as a marker for 32-bit PC-relative branches. */
7908 if (!object_64bit)
7909 return FALSE;
7910
7911 /* Weak or undefined symbol need PLT32 relocation. */
7912 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7913 return TRUE;
7914
7915 /* Non-global symbol doesn't need PLT32 relocation. */
7916 if (! S_IS_EXTERNAL (s))
7917 return FALSE;
7918
7919 /* Other global symbols need PLT32 relocation. NB: Symbol with
7920 non-default visibilities are treated as normal global symbol
7921 so that PLT32 relocation can be used as a marker for 32-bit
7922 PC-relative branches. It is useful for linker relaxation. */
7923 return TRUE;
7924 }
7925 #endif
7926
7927 static void
7928 output_jump (void)
7929 {
7930 char *p;
7931 int size;
7932 fixS *fixP;
7933 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
7934
7935 if (i.tm.opcode_modifier.jumpbyte)
7936 {
7937 /* This is a loop or jecxz type instruction. */
7938 size = 1;
7939 if (i.prefix[ADDR_PREFIX] != 0)
7940 {
7941 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
7942 i.prefixes -= 1;
7943 }
7944 /* Pentium4 branch hints. */
7945 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7946 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7947 {
7948 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
7949 i.prefixes--;
7950 }
7951 }
7952 else
7953 {
7954 int code16;
7955
7956 code16 = 0;
7957 if (flag_code == CODE_16BIT)
7958 code16 = CODE16;
7959
7960 if (i.prefix[DATA_PREFIX] != 0)
7961 {
7962 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
7963 i.prefixes -= 1;
7964 code16 ^= CODE16;
7965 }
7966
7967 size = 4;
7968 if (code16)
7969 size = 2;
7970 }
7971
7972 if (i.prefix[REX_PREFIX] != 0)
7973 {
7974 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7975 i.prefixes -= 1;
7976 }
7977
7978 /* BND prefixed jump. */
7979 if (i.prefix[BND_PREFIX] != 0)
7980 {
7981 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7982 i.prefixes -= 1;
7983 }
7984
7985 if (i.prefixes != 0 && !intel_syntax)
7986 as_warn (_("skipping prefixes on this instruction"));
7987
7988 p = frag_more (i.tm.opcode_length + size);
7989 switch (i.tm.opcode_length)
7990 {
7991 case 2:
7992 *p++ = i.tm.base_opcode >> 8;
7993 /* Fall through. */
7994 case 1:
7995 *p++ = i.tm.base_opcode;
7996 break;
7997 default:
7998 abort ();
7999 }
8000
8001 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8002 if (size == 4
8003 && jump_reloc == NO_RELOC
8004 && need_plt32_p (i.op[0].disps->X_add_symbol))
8005 jump_reloc = BFD_RELOC_X86_64_PLT32;
8006 #endif
8007
8008 jump_reloc = reloc (size, 1, 1, jump_reloc);
8009
8010 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8011 i.op[0].disps, 1, jump_reloc);
8012
8013 /* All jumps handled here are signed, but don't use a signed limit
8014 check for 32 and 16 bit jumps as we want to allow wrap around at
8015 4G and 64k respectively. */
8016 if (size == 1)
8017 fixP->fx_signed = 1;
8018 }
8019
8020 static void
8021 output_interseg_jump (void)
8022 {
8023 char *p;
8024 int size;
8025 int prefix;
8026 int code16;
8027
8028 code16 = 0;
8029 if (flag_code == CODE_16BIT)
8030 code16 = CODE16;
8031
8032 prefix = 0;
8033 if (i.prefix[DATA_PREFIX] != 0)
8034 {
8035 prefix = 1;
8036 i.prefixes -= 1;
8037 code16 ^= CODE16;
8038 }
8039 if (i.prefix[REX_PREFIX] != 0)
8040 {
8041 prefix++;
8042 i.prefixes -= 1;
8043 }
8044
8045 size = 4;
8046 if (code16)
8047 size = 2;
8048
8049 if (i.prefixes != 0 && !intel_syntax)
8050 as_warn (_("skipping prefixes on this instruction"));
8051
8052 /* 1 opcode; 2 segment; offset */
8053 p = frag_more (prefix + 1 + 2 + size);
8054
8055 if (i.prefix[DATA_PREFIX] != 0)
8056 *p++ = DATA_PREFIX_OPCODE;
8057
8058 if (i.prefix[REX_PREFIX] != 0)
8059 *p++ = i.prefix[REX_PREFIX];
8060
8061 *p++ = i.tm.base_opcode;
8062 if (i.op[1].imms->X_op == O_constant)
8063 {
8064 offsetT n = i.op[1].imms->X_add_number;
8065
8066 if (size == 2
8067 && !fits_in_unsigned_word (n)
8068 && !fits_in_signed_word (n))
8069 {
8070 as_bad (_("16-bit jump out of range"));
8071 return;
8072 }
8073 md_number_to_chars (p, n, size);
8074 }
8075 else
8076 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8077 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8078 if (i.op[0].imms->X_op != O_constant)
8079 as_bad (_("can't handle non absolute segment in `%s'"),
8080 i.tm.name);
8081 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
8082 }
8083
8084 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8085 void
8086 x86_cleanup (void)
8087 {
8088 char *p;
8089 asection *seg = now_seg;
8090 subsegT subseg = now_subseg;
8091 asection *sec;
8092 unsigned int alignment, align_size_1;
8093 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8094 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8095 unsigned int padding;
8096
8097 if (!IS_ELF || !x86_used_note)
8098 return;
8099
8100 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8101
8102 /* The .note.gnu.property section layout:
8103
8104 Field Length Contents
8105 ---- ---- ----
8106 n_namsz 4 4
8107 n_descsz 4 The note descriptor size
8108 n_type 4 NT_GNU_PROPERTY_TYPE_0
8109 n_name 4 "GNU"
8110 n_desc n_descsz The program property array
8111 .... .... ....
8112 */
8113
8114 /* Create the .note.gnu.property section. */
8115 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8116 bfd_set_section_flags (sec,
8117 (SEC_ALLOC
8118 | SEC_LOAD
8119 | SEC_DATA
8120 | SEC_HAS_CONTENTS
8121 | SEC_READONLY));
8122
8123 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8124 {
8125 align_size_1 = 7;
8126 alignment = 3;
8127 }
8128 else
8129 {
8130 align_size_1 = 3;
8131 alignment = 2;
8132 }
8133
8134 bfd_set_section_alignment (sec, alignment);
8135 elf_section_type (sec) = SHT_NOTE;
8136
8137 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8138 + 4-byte data */
8139 isa_1_descsz_raw = 4 + 4 + 4;
8140 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8141 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8142
8143 feature_2_descsz_raw = isa_1_descsz;
8144 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8145 + 4-byte data */
8146 feature_2_descsz_raw += 4 + 4 + 4;
8147 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8148 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8149 & ~align_size_1);
8150
8151 descsz = feature_2_descsz;
8152 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8153 p = frag_more (4 + 4 + 4 + 4 + descsz);
8154
8155 /* Write n_namsz. */
8156 md_number_to_chars (p, (valueT) 4, 4);
8157
8158 /* Write n_descsz. */
8159 md_number_to_chars (p + 4, (valueT) descsz, 4);
8160
8161 /* Write n_type. */
8162 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8163
8164 /* Write n_name. */
8165 memcpy (p + 4 * 3, "GNU", 4);
8166
8167 /* Write 4-byte type. */
8168 md_number_to_chars (p + 4 * 4,
8169 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8170
8171 /* Write 4-byte data size. */
8172 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8173
8174 /* Write 4-byte data. */
8175 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8176
8177 /* Zero out paddings. */
8178 padding = isa_1_descsz - isa_1_descsz_raw;
8179 if (padding)
8180 memset (p + 4 * 7, 0, padding);
8181
8182 /* Write 4-byte type. */
8183 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8184 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8185
8186 /* Write 4-byte data size. */
8187 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8188
8189 /* Write 4-byte data. */
8190 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8191 (valueT) x86_feature_2_used, 4);
8192
8193 /* Zero out paddings. */
8194 padding = feature_2_descsz - feature_2_descsz_raw;
8195 if (padding)
8196 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8197
8198 /* We probably can't restore the current segment, for there likely
8199 isn't one yet... */
8200 if (seg && subseg)
8201 subseg_set (seg, subseg);
8202 }
8203 #endif
8204
8205 static unsigned int
8206 encoding_length (const fragS *start_frag, offsetT start_off,
8207 const char *frag_now_ptr)
8208 {
8209 unsigned int len = 0;
8210
8211 if (start_frag != frag_now)
8212 {
8213 const fragS *fr = start_frag;
8214
8215 do {
8216 len += fr->fr_fix;
8217 fr = fr->fr_next;
8218 } while (fr && fr != frag_now);
8219 }
8220
8221 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8222 }
8223
8224 static void
8225 output_insn (void)
8226 {
8227 fragS *insn_start_frag;
8228 offsetT insn_start_off;
8229
8230 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8231 if (IS_ELF && x86_used_note)
8232 {
8233 if (i.tm.cpu_flags.bitfield.cpucmov)
8234 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
8235 if (i.tm.cpu_flags.bitfield.cpusse)
8236 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
8237 if (i.tm.cpu_flags.bitfield.cpusse2)
8238 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
8239 if (i.tm.cpu_flags.bitfield.cpusse3)
8240 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
8241 if (i.tm.cpu_flags.bitfield.cpussse3)
8242 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
8243 if (i.tm.cpu_flags.bitfield.cpusse4_1)
8244 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
8245 if (i.tm.cpu_flags.bitfield.cpusse4_2)
8246 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
8247 if (i.tm.cpu_flags.bitfield.cpuavx)
8248 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
8249 if (i.tm.cpu_flags.bitfield.cpuavx2)
8250 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
8251 if (i.tm.cpu_flags.bitfield.cpufma)
8252 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
8253 if (i.tm.cpu_flags.bitfield.cpuavx512f)
8254 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
8255 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
8256 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
8257 if (i.tm.cpu_flags.bitfield.cpuavx512er)
8258 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
8259 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
8260 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
8261 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
8262 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
8263 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
8264 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
8265 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
8266 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
8267 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
8268 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
8269 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
8270 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
8271 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
8272 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
8273 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
8274 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
8275 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
8276 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
8277 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
8278 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
8279 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
8280 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
8281 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
8282 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
8283
8284 if (i.tm.cpu_flags.bitfield.cpu8087
8285 || i.tm.cpu_flags.bitfield.cpu287
8286 || i.tm.cpu_flags.bitfield.cpu387
8287 || i.tm.cpu_flags.bitfield.cpu687
8288 || i.tm.cpu_flags.bitfield.cpufisttp)
8289 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
8290 /* Don't set GNU_PROPERTY_X86_FEATURE_2_MMX for prefetchtXXX nor
8291 Xfence instructions. */
8292 if (i.tm.base_opcode != 0xf18
8293 && i.tm.base_opcode != 0xf0d
8294 && i.tm.base_opcode != 0xfaef8
8295 && (i.has_regmmx
8296 || i.tm.cpu_flags.bitfield.cpummx
8297 || i.tm.cpu_flags.bitfield.cpua3dnow
8298 || i.tm.cpu_flags.bitfield.cpua3dnowa))
8299 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
8300 if (i.has_regxmm)
8301 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
8302 if (i.has_regymm)
8303 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
8304 if (i.has_regzmm)
8305 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
8306 if (i.tm.cpu_flags.bitfield.cpufxsr)
8307 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
8308 if (i.tm.cpu_flags.bitfield.cpuxsave)
8309 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
8310 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
8311 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
8312 if (i.tm.cpu_flags.bitfield.cpuxsavec)
8313 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
8314 }
8315 #endif
8316
8317 /* Tie dwarf2 debug info to the address at the start of the insn.
8318 We can't do this after the insn has been output as the current
8319 frag may have been closed off. eg. by frag_var. */
8320 dwarf2_emit_insn (0);
8321
8322 insn_start_frag = frag_now;
8323 insn_start_off = frag_now_fix ();
8324
8325 /* Output jumps. */
8326 if (i.tm.opcode_modifier.jump)
8327 output_branch ();
8328 else if (i.tm.opcode_modifier.jumpbyte
8329 || i.tm.opcode_modifier.jumpdword)
8330 output_jump ();
8331 else if (i.tm.opcode_modifier.jumpintersegment)
8332 output_interseg_jump ();
8333 else
8334 {
8335 /* Output normal instructions here. */
8336 char *p;
8337 unsigned char *q;
8338 unsigned int j;
8339 unsigned int prefix;
8340
8341 if (avoid_fence
8342 && (i.tm.base_opcode == 0xfaee8
8343 || i.tm.base_opcode == 0xfaef0
8344 || i.tm.base_opcode == 0xfaef8))
8345 {
8346 /* Encode lfence, mfence, and sfence as
8347 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
8348 offsetT val = 0x240483f0ULL;
8349 p = frag_more (5);
8350 md_number_to_chars (p, val, 5);
8351 return;
8352 }
8353
8354 /* Some processors fail on LOCK prefix. This options makes
8355 assembler ignore LOCK prefix and serves as a workaround. */
8356 if (omit_lock_prefix)
8357 {
8358 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
8359 return;
8360 i.prefix[LOCK_PREFIX] = 0;
8361 }
8362
8363 /* Since the VEX/EVEX prefix contains the implicit prefix, we
8364 don't need the explicit prefix. */
8365 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
8366 {
8367 switch (i.tm.opcode_length)
8368 {
8369 case 3:
8370 if (i.tm.base_opcode & 0xff000000)
8371 {
8372 prefix = (i.tm.base_opcode >> 24) & 0xff;
8373 if (!i.tm.cpu_flags.bitfield.cpupadlock
8374 || prefix != REPE_PREFIX_OPCODE
8375 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
8376 add_prefix (prefix);
8377 }
8378 break;
8379 case 2:
8380 if ((i.tm.base_opcode & 0xff0000) != 0)
8381 {
8382 prefix = (i.tm.base_opcode >> 16) & 0xff;
8383 add_prefix (prefix);
8384 }
8385 break;
8386 case 1:
8387 break;
8388 case 0:
8389 /* Check for pseudo prefixes. */
8390 as_bad_where (insn_start_frag->fr_file,
8391 insn_start_frag->fr_line,
8392 _("pseudo prefix without instruction"));
8393 return;
8394 default:
8395 abort ();
8396 }
8397
8398 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8399 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
8400 R_X86_64_GOTTPOFF relocation so that linker can safely
8401 perform IE->LE optimization. */
8402 if (x86_elf_abi == X86_64_X32_ABI
8403 && i.operands == 2
8404 && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
8405 && i.prefix[REX_PREFIX] == 0)
8406 add_prefix (REX_OPCODE);
8407 #endif
8408
8409 /* The prefix bytes. */
8410 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
8411 if (*q)
8412 FRAG_APPEND_1_CHAR (*q);
8413 }
8414 else
8415 {
8416 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
8417 if (*q)
8418 switch (j)
8419 {
8420 case REX_PREFIX:
8421 /* REX byte is encoded in VEX prefix. */
8422 break;
8423 case SEG_PREFIX:
8424 case ADDR_PREFIX:
8425 FRAG_APPEND_1_CHAR (*q);
8426 break;
8427 default:
8428 /* There should be no other prefixes for instructions
8429 with VEX prefix. */
8430 abort ();
8431 }
8432
8433 /* For EVEX instructions i.vrex should become 0 after
8434 build_evex_prefix. For VEX instructions upper 16 registers
8435 aren't available, so VREX should be 0. */
8436 if (i.vrex)
8437 abort ();
8438 /* Now the VEX prefix. */
8439 p = frag_more (i.vex.length);
8440 for (j = 0; j < i.vex.length; j++)
8441 p[j] = i.vex.bytes[j];
8442 }
8443
8444 /* Now the opcode; be careful about word order here! */
8445 if (i.tm.opcode_length == 1)
8446 {
8447 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
8448 }
8449 else
8450 {
8451 switch (i.tm.opcode_length)
8452 {
8453 case 4:
8454 p = frag_more (4);
8455 *p++ = (i.tm.base_opcode >> 24) & 0xff;
8456 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8457 break;
8458 case 3:
8459 p = frag_more (3);
8460 *p++ = (i.tm.base_opcode >> 16) & 0xff;
8461 break;
8462 case 2:
8463 p = frag_more (2);
8464 break;
8465 default:
8466 abort ();
8467 break;
8468 }
8469
8470 /* Put out high byte first: can't use md_number_to_chars! */
8471 *p++ = (i.tm.base_opcode >> 8) & 0xff;
8472 *p = i.tm.base_opcode & 0xff;
8473 }
8474
8475 /* Now the modrm byte and sib byte (if present). */
8476 if (i.tm.opcode_modifier.modrm)
8477 {
8478 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
8479 | i.rm.reg << 3
8480 | i.rm.mode << 6));
8481 /* If i.rm.regmem == ESP (4)
8482 && i.rm.mode != (Register mode)
8483 && not 16 bit
8484 ==> need second modrm byte. */
8485 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
8486 && i.rm.mode != 3
8487 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
8488 FRAG_APPEND_1_CHAR ((i.sib.base << 0
8489 | i.sib.index << 3
8490 | i.sib.scale << 6));
8491 }
8492
8493 if (i.disp_operands)
8494 output_disp (insn_start_frag, insn_start_off);
8495
8496 if (i.imm_operands)
8497 output_imm (insn_start_frag, insn_start_off);
8498
8499 /*
8500 * frag_now_fix () returning plain abs_section_offset when we're in the
8501 * absolute section, and abs_section_offset not getting updated as data
8502 * gets added to the frag breaks the logic below.
8503 */
8504 if (now_seg != absolute_section)
8505 {
8506 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
8507 if (j > 15)
8508 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
8509 j);
8510 }
8511 }
8512
8513 #ifdef DEBUG386
8514 if (flag_debug)
8515 {
8516 pi ("" /*line*/, &i);
8517 }
8518 #endif /* DEBUG386 */
8519 }
8520
8521 /* Return the size of the displacement operand N. */
8522
8523 static int
8524 disp_size (unsigned int n)
8525 {
8526 int size = 4;
8527
8528 if (i.types[n].bitfield.disp64)
8529 size = 8;
8530 else if (i.types[n].bitfield.disp8)
8531 size = 1;
8532 else if (i.types[n].bitfield.disp16)
8533 size = 2;
8534 return size;
8535 }
8536
8537 /* Return the size of the immediate operand N. */
8538
8539 static int
8540 imm_size (unsigned int n)
8541 {
8542 int size = 4;
8543 if (i.types[n].bitfield.imm64)
8544 size = 8;
8545 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8546 size = 1;
8547 else if (i.types[n].bitfield.imm16)
8548 size = 2;
8549 return size;
8550 }
8551
8552 static void
8553 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8554 {
8555 char *p;
8556 unsigned int n;
8557
8558 for (n = 0; n < i.operands; n++)
8559 {
8560 if (operand_type_check (i.types[n], disp))
8561 {
8562 if (i.op[n].disps->X_op == O_constant)
8563 {
8564 int size = disp_size (n);
8565 offsetT val = i.op[n].disps->X_add_number;
8566
8567 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8568 size);
8569 p = frag_more (size);
8570 md_number_to_chars (p, val, size);
8571 }
8572 else
8573 {
8574 enum bfd_reloc_code_real reloc_type;
8575 int size = disp_size (n);
8576 int sign = i.types[n].bitfield.disp32s;
8577 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8578 fixS *fixP;
8579
8580 /* We can't have 8 bit displacement here. */
8581 gas_assert (!i.types[n].bitfield.disp8);
8582
8583 /* The PC relative address is computed relative
8584 to the instruction boundary, so in case immediate
8585 fields follows, we need to adjust the value. */
8586 if (pcrel && i.imm_operands)
8587 {
8588 unsigned int n1;
8589 int sz = 0;
8590
8591 for (n1 = 0; n1 < i.operands; n1++)
8592 if (operand_type_check (i.types[n1], imm))
8593 {
8594 /* Only one immediate is allowed for PC
8595 relative address. */
8596 gas_assert (sz == 0);
8597 sz = imm_size (n1);
8598 i.op[n].disps->X_add_number -= sz;
8599 }
8600 /* We should find the immediate. */
8601 gas_assert (sz != 0);
8602 }
8603
8604 p = frag_more (size);
8605 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
8606 if (GOT_symbol
8607 && GOT_symbol == i.op[n].disps->X_add_symbol
8608 && (((reloc_type == BFD_RELOC_32
8609 || reloc_type == BFD_RELOC_X86_64_32S
8610 || (reloc_type == BFD_RELOC_64
8611 && object_64bit))
8612 && (i.op[n].disps->X_op == O_symbol
8613 || (i.op[n].disps->X_op == O_add
8614 && ((symbol_get_value_expression
8615 (i.op[n].disps->X_op_symbol)->X_op)
8616 == O_subtract))))
8617 || reloc_type == BFD_RELOC_32_PCREL))
8618 {
8619 if (!object_64bit)
8620 {
8621 reloc_type = BFD_RELOC_386_GOTPC;
8622 i.op[n].imms->X_add_number +=
8623 encoding_length (insn_start_frag, insn_start_off, p);
8624 }
8625 else if (reloc_type == BFD_RELOC_64)
8626 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8627 else
8628 /* Don't do the adjustment for x86-64, as there
8629 the pcrel addressing is relative to the _next_
8630 insn, and that is taken care of in other code. */
8631 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8632 }
8633 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
8634 size, i.op[n].disps, pcrel,
8635 reloc_type);
8636 /* Check for "call/jmp *mem", "mov mem, %reg",
8637 "test %reg, mem" and "binop mem, %reg" where binop
8638 is one of adc, add, and, cmp, or, sbb, sub, xor
8639 instructions without data prefix. Always generate
8640 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
8641 if (i.prefix[DATA_PREFIX] == 0
8642 && (generate_relax_relocations
8643 || (!object_64bit
8644 && i.rm.mode == 0
8645 && i.rm.regmem == 5))
8646 && (i.rm.mode == 2
8647 || (i.rm.mode == 0 && i.rm.regmem == 5))
8648 && ((i.operands == 1
8649 && i.tm.base_opcode == 0xff
8650 && (i.rm.reg == 2 || i.rm.reg == 4))
8651 || (i.operands == 2
8652 && (i.tm.base_opcode == 0x8b
8653 || i.tm.base_opcode == 0x85
8654 || (i.tm.base_opcode & 0xc7) == 0x03))))
8655 {
8656 if (object_64bit)
8657 {
8658 fixP->fx_tcbit = i.rex != 0;
8659 if (i.base_reg
8660 && (i.base_reg->reg_num == RegIP))
8661 fixP->fx_tcbit2 = 1;
8662 }
8663 else
8664 fixP->fx_tcbit2 = 1;
8665 }
8666 }
8667 }
8668 }
8669 }
8670
8671 static void
8672 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
8673 {
8674 char *p;
8675 unsigned int n;
8676
8677 for (n = 0; n < i.operands; n++)
8678 {
8679 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
8680 if (i.rounding && (int) n == i.rounding->operand)
8681 continue;
8682
8683 if (operand_type_check (i.types[n], imm))
8684 {
8685 if (i.op[n].imms->X_op == O_constant)
8686 {
8687 int size = imm_size (n);
8688 offsetT val;
8689
8690 val = offset_in_range (i.op[n].imms->X_add_number,
8691 size);
8692 p = frag_more (size);
8693 md_number_to_chars (p, val, size);
8694 }
8695 else
8696 {
8697 /* Not absolute_section.
8698 Need a 32-bit fixup (don't support 8bit
8699 non-absolute imms). Try to support other
8700 sizes ... */
8701 enum bfd_reloc_code_real reloc_type;
8702 int size = imm_size (n);
8703 int sign;
8704
8705 if (i.types[n].bitfield.imm32s
8706 && (i.suffix == QWORD_MNEM_SUFFIX
8707 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
8708 sign = 1;
8709 else
8710 sign = 0;
8711
8712 p = frag_more (size);
8713 reloc_type = reloc (size, 0, sign, i.reloc[n]);
8714
8715 /* This is tough to explain. We end up with this one if we
8716 * have operands that look like
8717 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
8718 * obtain the absolute address of the GOT, and it is strongly
8719 * preferable from a performance point of view to avoid using
8720 * a runtime relocation for this. The actual sequence of
8721 * instructions often look something like:
8722 *
8723 * call .L66
8724 * .L66:
8725 * popl %ebx
8726 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
8727 *
8728 * The call and pop essentially return the absolute address
8729 * of the label .L66 and store it in %ebx. The linker itself
8730 * will ultimately change the first operand of the addl so
8731 * that %ebx points to the GOT, but to keep things simple, the
8732 * .o file must have this operand set so that it generates not
8733 * the absolute address of .L66, but the absolute address of
8734 * itself. This allows the linker itself simply treat a GOTPC
8735 * relocation as asking for a pcrel offset to the GOT to be
8736 * added in, and the addend of the relocation is stored in the
8737 * operand field for the instruction itself.
8738 *
8739 * Our job here is to fix the operand so that it would add
8740 * the correct offset so that %ebx would point to itself. The
8741 * thing that is tricky is that .-.L66 will point to the
8742 * beginning of the instruction, so we need to further modify
8743 * the operand so that it will point to itself. There are
8744 * other cases where you have something like:
8745 *
8746 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
8747 *
8748 * and here no correction would be required. Internally in
8749 * the assembler we treat operands of this form as not being
8750 * pcrel since the '.' is explicitly mentioned, and I wonder
8751 * whether it would simplify matters to do it this way. Who
8752 * knows. In earlier versions of the PIC patches, the
8753 * pcrel_adjust field was used to store the correction, but
8754 * since the expression is not pcrel, I felt it would be
8755 * confusing to do it this way. */
8756
8757 if ((reloc_type == BFD_RELOC_32
8758 || reloc_type == BFD_RELOC_X86_64_32S
8759 || reloc_type == BFD_RELOC_64)
8760 && GOT_symbol
8761 && GOT_symbol == i.op[n].imms->X_add_symbol
8762 && (i.op[n].imms->X_op == O_symbol
8763 || (i.op[n].imms->X_op == O_add
8764 && ((symbol_get_value_expression
8765 (i.op[n].imms->X_op_symbol)->X_op)
8766 == O_subtract))))
8767 {
8768 if (!object_64bit)
8769 reloc_type = BFD_RELOC_386_GOTPC;
8770 else if (size == 4)
8771 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8772 else if (size == 8)
8773 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8774 i.op[n].imms->X_add_number +=
8775 encoding_length (insn_start_frag, insn_start_off, p);
8776 }
8777 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8778 i.op[n].imms, 0, reloc_type);
8779 }
8780 }
8781 }
8782 }
8783 \f
8784 /* x86_cons_fix_new is called via the expression parsing code when a
8785 reloc is needed. We use this hook to get the correct .got reloc. */
8786 static int cons_sign = -1;
8787
8788 void
8789 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
8790 expressionS *exp, bfd_reloc_code_real_type r)
8791 {
8792 r = reloc (len, 0, cons_sign, r);
8793
8794 #ifdef TE_PE
8795 if (exp->X_op == O_secrel)
8796 {
8797 exp->X_op = O_symbol;
8798 r = BFD_RELOC_32_SECREL;
8799 }
8800 #endif
8801
8802 fix_new_exp (frag, off, len, exp, 0, r);
8803 }
8804
8805 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
8806 purpose of the `.dc.a' internal pseudo-op. */
8807
8808 int
8809 x86_address_bytes (void)
8810 {
8811 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
8812 return 4;
8813 return stdoutput->arch_info->bits_per_address / 8;
8814 }
8815
8816 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
8817 || defined (LEX_AT)
8818 # define lex_got(reloc, adjust, types) NULL
8819 #else
8820 /* Parse operands of the form
8821 <symbol>@GOTOFF+<nnn>
8822 and similar .plt or .got references.
8823
8824 If we find one, set up the correct relocation in RELOC and copy the
8825 input string, minus the `@GOTOFF' into a malloc'd buffer for
8826 parsing by the calling routine. Return this buffer, and if ADJUST
8827 is non-null set it to the length of the string we removed from the
8828 input line. Otherwise return NULL. */
8829 static char *
8830 lex_got (enum bfd_reloc_code_real *rel,
8831 int *adjust,
8832 i386_operand_type *types)
8833 {
8834 /* Some of the relocations depend on the size of what field is to
8835 be relocated. But in our callers i386_immediate and i386_displacement
8836 we don't yet know the operand size (this will be set by insn
8837 matching). Hence we record the word32 relocation here,
8838 and adjust the reloc according to the real size in reloc(). */
8839 static const struct {
8840 const char *str;
8841 int len;
8842 const enum bfd_reloc_code_real rel[2];
8843 const i386_operand_type types64;
8844 } gotrel[] = {
8845 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8846 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
8847 BFD_RELOC_SIZE32 },
8848 OPERAND_TYPE_IMM32_64 },
8849 #endif
8850 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
8851 BFD_RELOC_X86_64_PLTOFF64 },
8852 OPERAND_TYPE_IMM64 },
8853 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
8854 BFD_RELOC_X86_64_PLT32 },
8855 OPERAND_TYPE_IMM32_32S_DISP32 },
8856 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
8857 BFD_RELOC_X86_64_GOTPLT64 },
8858 OPERAND_TYPE_IMM64_DISP64 },
8859 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
8860 BFD_RELOC_X86_64_GOTOFF64 },
8861 OPERAND_TYPE_IMM64_DISP64 },
8862 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
8863 BFD_RELOC_X86_64_GOTPCREL },
8864 OPERAND_TYPE_IMM32_32S_DISP32 },
8865 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
8866 BFD_RELOC_X86_64_TLSGD },
8867 OPERAND_TYPE_IMM32_32S_DISP32 },
8868 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
8869 _dummy_first_bfd_reloc_code_real },
8870 OPERAND_TYPE_NONE },
8871 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
8872 BFD_RELOC_X86_64_TLSLD },
8873 OPERAND_TYPE_IMM32_32S_DISP32 },
8874 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
8875 BFD_RELOC_X86_64_GOTTPOFF },
8876 OPERAND_TYPE_IMM32_32S_DISP32 },
8877 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
8878 BFD_RELOC_X86_64_TPOFF32 },
8879 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8880 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
8881 _dummy_first_bfd_reloc_code_real },
8882 OPERAND_TYPE_NONE },
8883 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
8884 BFD_RELOC_X86_64_DTPOFF32 },
8885 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8886 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
8887 _dummy_first_bfd_reloc_code_real },
8888 OPERAND_TYPE_NONE },
8889 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
8890 _dummy_first_bfd_reloc_code_real },
8891 OPERAND_TYPE_NONE },
8892 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
8893 BFD_RELOC_X86_64_GOT32 },
8894 OPERAND_TYPE_IMM32_32S_64_DISP32 },
8895 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
8896 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
8897 OPERAND_TYPE_IMM32_32S_DISP32 },
8898 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
8899 BFD_RELOC_X86_64_TLSDESC_CALL },
8900 OPERAND_TYPE_IMM32_32S_DISP32 },
8901 };
8902 char *cp;
8903 unsigned int j;
8904
8905 #if defined (OBJ_MAYBE_ELF)
8906 if (!IS_ELF)
8907 return NULL;
8908 #endif
8909
8910 for (cp = input_line_pointer; *cp != '@'; cp++)
8911 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
8912 return NULL;
8913
8914 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
8915 {
8916 int len = gotrel[j].len;
8917 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
8918 {
8919 if (gotrel[j].rel[object_64bit] != 0)
8920 {
8921 int first, second;
8922 char *tmpbuf, *past_reloc;
8923
8924 *rel = gotrel[j].rel[object_64bit];
8925
8926 if (types)
8927 {
8928 if (flag_code != CODE_64BIT)
8929 {
8930 types->bitfield.imm32 = 1;
8931 types->bitfield.disp32 = 1;
8932 }
8933 else
8934 *types = gotrel[j].types64;
8935 }
8936
8937 if (j != 0 && GOT_symbol == NULL)
8938 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
8939
8940 /* The length of the first part of our input line. */
8941 first = cp - input_line_pointer;
8942
8943 /* The second part goes from after the reloc token until
8944 (and including) an end_of_line char or comma. */
8945 past_reloc = cp + 1 + len;
8946 cp = past_reloc;
8947 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
8948 ++cp;
8949 second = cp + 1 - past_reloc;
8950
8951 /* Allocate and copy string. The trailing NUL shouldn't
8952 be necessary, but be safe. */
8953 tmpbuf = XNEWVEC (char, first + second + 2);
8954 memcpy (tmpbuf, input_line_pointer, first);
8955 if (second != 0 && *past_reloc != ' ')
8956 /* Replace the relocation token with ' ', so that
8957 errors like foo@GOTOFF1 will be detected. */
8958 tmpbuf[first++] = ' ';
8959 else
8960 /* Increment length by 1 if the relocation token is
8961 removed. */
8962 len++;
8963 if (adjust)
8964 *adjust = len;
8965 memcpy (tmpbuf + first, past_reloc, second);
8966 tmpbuf[first + second] = '\0';
8967 return tmpbuf;
8968 }
8969
8970 as_bad (_("@%s reloc is not supported with %d-bit output format"),
8971 gotrel[j].str, 1 << (5 + object_64bit));
8972 return NULL;
8973 }
8974 }
8975
8976 /* Might be a symbol version string. Don't as_bad here. */
8977 return NULL;
8978 }
8979 #endif
8980
8981 #ifdef TE_PE
8982 #ifdef lex_got
8983 #undef lex_got
8984 #endif
8985 /* Parse operands of the form
8986 <symbol>@SECREL32+<nnn>
8987
8988 If we find one, set up the correct relocation in RELOC and copy the
8989 input string, minus the `@SECREL32' into a malloc'd buffer for
8990 parsing by the calling routine. Return this buffer, and if ADJUST
8991 is non-null set it to the length of the string we removed from the
8992 input line. Otherwise return NULL.
8993
8994 This function is copied from the ELF version above adjusted for PE targets. */
8995
8996 static char *
8997 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
8998 int *adjust ATTRIBUTE_UNUSED,
8999 i386_operand_type *types)
9000 {
9001 static const struct
9002 {
9003 const char *str;
9004 int len;
9005 const enum bfd_reloc_code_real rel[2];
9006 const i386_operand_type types64;
9007 }
9008 gotrel[] =
9009 {
9010 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
9011 BFD_RELOC_32_SECREL },
9012 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
9013 };
9014
9015 char *cp;
9016 unsigned j;
9017
9018 for (cp = input_line_pointer; *cp != '@'; cp++)
9019 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
9020 return NULL;
9021
9022 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
9023 {
9024 int len = gotrel[j].len;
9025
9026 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
9027 {
9028 if (gotrel[j].rel[object_64bit] != 0)
9029 {
9030 int first, second;
9031 char *tmpbuf, *past_reloc;
9032
9033 *rel = gotrel[j].rel[object_64bit];
9034 if (adjust)
9035 *adjust = len;
9036
9037 if (types)
9038 {
9039 if (flag_code != CODE_64BIT)
9040 {
9041 types->bitfield.imm32 = 1;
9042 types->bitfield.disp32 = 1;
9043 }
9044 else
9045 *types = gotrel[j].types64;
9046 }
9047
9048 /* The length of the first part of our input line. */
9049 first = cp - input_line_pointer;
9050
9051 /* The second part goes from after the reloc token until
9052 (and including) an end_of_line char or comma. */
9053 past_reloc = cp + 1 + len;
9054 cp = past_reloc;
9055 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
9056 ++cp;
9057 second = cp + 1 - past_reloc;
9058
9059 /* Allocate and copy string. The trailing NUL shouldn't
9060 be necessary, but be safe. */
9061 tmpbuf = XNEWVEC (char, first + second + 2);
9062 memcpy (tmpbuf, input_line_pointer, first);
9063 if (second != 0 && *past_reloc != ' ')
9064 /* Replace the relocation token with ' ', so that
9065 errors like foo@SECLREL321 will be detected. */
9066 tmpbuf[first++] = ' ';
9067 memcpy (tmpbuf + first, past_reloc, second);
9068 tmpbuf[first + second] = '\0';
9069 return tmpbuf;
9070 }
9071
9072 as_bad (_("@%s reloc is not supported with %d-bit output format"),
9073 gotrel[j].str, 1 << (5 + object_64bit));
9074 return NULL;
9075 }
9076 }
9077
9078 /* Might be a symbol version string. Don't as_bad here. */
9079 return NULL;
9080 }
9081
9082 #endif /* TE_PE */
9083
9084 bfd_reloc_code_real_type
9085 x86_cons (expressionS *exp, int size)
9086 {
9087 bfd_reloc_code_real_type got_reloc = NO_RELOC;
9088
9089 intel_syntax = -intel_syntax;
9090
9091 exp->X_md = 0;
9092 if (size == 4 || (object_64bit && size == 8))
9093 {
9094 /* Handle @GOTOFF and the like in an expression. */
9095 char *save;
9096 char *gotfree_input_line;
9097 int adjust = 0;
9098
9099 save = input_line_pointer;
9100 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
9101 if (gotfree_input_line)
9102 input_line_pointer = gotfree_input_line;
9103
9104 expression (exp);
9105
9106 if (gotfree_input_line)
9107 {
9108 /* expression () has merrily parsed up to the end of line,
9109 or a comma - in the wrong buffer. Transfer how far
9110 input_line_pointer has moved to the right buffer. */
9111 input_line_pointer = (save
9112 + (input_line_pointer - gotfree_input_line)
9113 + adjust);
9114 free (gotfree_input_line);
9115 if (exp->X_op == O_constant
9116 || exp->X_op == O_absent
9117 || exp->X_op == O_illegal
9118 || exp->X_op == O_register
9119 || exp->X_op == O_big)
9120 {
9121 char c = *input_line_pointer;
9122 *input_line_pointer = 0;
9123 as_bad (_("missing or invalid expression `%s'"), save);
9124 *input_line_pointer = c;
9125 }
9126 else if ((got_reloc == BFD_RELOC_386_PLT32
9127 || got_reloc == BFD_RELOC_X86_64_PLT32)
9128 && exp->X_op != O_symbol)
9129 {
9130 char c = *input_line_pointer;
9131 *input_line_pointer = 0;
9132 as_bad (_("invalid PLT expression `%s'"), save);
9133 *input_line_pointer = c;
9134 }
9135 }
9136 }
9137 else
9138 expression (exp);
9139
9140 intel_syntax = -intel_syntax;
9141
9142 if (intel_syntax)
9143 i386_intel_simplify (exp);
9144
9145 return got_reloc;
9146 }
9147
9148 static void
9149 signed_cons (int size)
9150 {
9151 if (flag_code == CODE_64BIT)
9152 cons_sign = 1;
9153 cons (size);
9154 cons_sign = -1;
9155 }
9156
9157 #ifdef TE_PE
9158 static void
9159 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
9160 {
9161 expressionS exp;
9162
9163 do
9164 {
9165 expression (&exp);
9166 if (exp.X_op == O_symbol)
9167 exp.X_op = O_secrel;
9168
9169 emit_expr (&exp, 4);
9170 }
9171 while (*input_line_pointer++ == ',');
9172
9173 input_line_pointer--;
9174 demand_empty_rest_of_line ();
9175 }
9176 #endif
9177
9178 /* Handle Vector operations. */
9179
9180 static char *
9181 check_VecOperations (char *op_string, char *op_end)
9182 {
9183 const reg_entry *mask;
9184 const char *saved;
9185 char *end_op;
9186
9187 while (*op_string
9188 && (op_end == NULL || op_string < op_end))
9189 {
9190 saved = op_string;
9191 if (*op_string == '{')
9192 {
9193 op_string++;
9194
9195 /* Check broadcasts. */
9196 if (strncmp (op_string, "1to", 3) == 0)
9197 {
9198 int bcst_type;
9199
9200 if (i.broadcast)
9201 goto duplicated_vec_op;
9202
9203 op_string += 3;
9204 if (*op_string == '8')
9205 bcst_type = 8;
9206 else if (*op_string == '4')
9207 bcst_type = 4;
9208 else if (*op_string == '2')
9209 bcst_type = 2;
9210 else if (*op_string == '1'
9211 && *(op_string+1) == '6')
9212 {
9213 bcst_type = 16;
9214 op_string++;
9215 }
9216 else
9217 {
9218 as_bad (_("Unsupported broadcast: `%s'"), saved);
9219 return NULL;
9220 }
9221 op_string++;
9222
9223 broadcast_op.type = bcst_type;
9224 broadcast_op.operand = this_operand;
9225 broadcast_op.bytes = 0;
9226 i.broadcast = &broadcast_op;
9227 }
9228 /* Check masking operation. */
9229 else if ((mask = parse_register (op_string, &end_op)) != NULL)
9230 {
9231 /* k0 can't be used for write mask. */
9232 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
9233 {
9234 as_bad (_("`%s%s' can't be used for write mask"),
9235 register_prefix, mask->reg_name);
9236 return NULL;
9237 }
9238
9239 if (!i.mask)
9240 {
9241 mask_op.mask = mask;
9242 mask_op.zeroing = 0;
9243 mask_op.operand = this_operand;
9244 i.mask = &mask_op;
9245 }
9246 else
9247 {
9248 if (i.mask->mask)
9249 goto duplicated_vec_op;
9250
9251 i.mask->mask = mask;
9252
9253 /* Only "{z}" is allowed here. No need to check
9254 zeroing mask explicitly. */
9255 if (i.mask->operand != this_operand)
9256 {
9257 as_bad (_("invalid write mask `%s'"), saved);
9258 return NULL;
9259 }
9260 }
9261
9262 op_string = end_op;
9263 }
9264 /* Check zeroing-flag for masking operation. */
9265 else if (*op_string == 'z')
9266 {
9267 if (!i.mask)
9268 {
9269 mask_op.mask = NULL;
9270 mask_op.zeroing = 1;
9271 mask_op.operand = this_operand;
9272 i.mask = &mask_op;
9273 }
9274 else
9275 {
9276 if (i.mask->zeroing)
9277 {
9278 duplicated_vec_op:
9279 as_bad (_("duplicated `%s'"), saved);
9280 return NULL;
9281 }
9282
9283 i.mask->zeroing = 1;
9284
9285 /* Only "{%k}" is allowed here. No need to check mask
9286 register explicitly. */
9287 if (i.mask->operand != this_operand)
9288 {
9289 as_bad (_("invalid zeroing-masking `%s'"),
9290 saved);
9291 return NULL;
9292 }
9293 }
9294
9295 op_string++;
9296 }
9297 else
9298 goto unknown_vec_op;
9299
9300 if (*op_string != '}')
9301 {
9302 as_bad (_("missing `}' in `%s'"), saved);
9303 return NULL;
9304 }
9305 op_string++;
9306
9307 /* Strip whitespace since the addition of pseudo prefixes
9308 changed how the scrubber treats '{'. */
9309 if (is_space_char (*op_string))
9310 ++op_string;
9311
9312 continue;
9313 }
9314 unknown_vec_op:
9315 /* We don't know this one. */
9316 as_bad (_("unknown vector operation: `%s'"), saved);
9317 return NULL;
9318 }
9319
9320 if (i.mask && i.mask->zeroing && !i.mask->mask)
9321 {
9322 as_bad (_("zeroing-masking only allowed with write mask"));
9323 return NULL;
9324 }
9325
9326 return op_string;
9327 }
9328
9329 static int
9330 i386_immediate (char *imm_start)
9331 {
9332 char *save_input_line_pointer;
9333 char *gotfree_input_line;
9334 segT exp_seg = 0;
9335 expressionS *exp;
9336 i386_operand_type types;
9337
9338 operand_type_set (&types, ~0);
9339
9340 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
9341 {
9342 as_bad (_("at most %d immediate operands are allowed"),
9343 MAX_IMMEDIATE_OPERANDS);
9344 return 0;
9345 }
9346
9347 exp = &im_expressions[i.imm_operands++];
9348 i.op[this_operand].imms = exp;
9349
9350 if (is_space_char (*imm_start))
9351 ++imm_start;
9352
9353 save_input_line_pointer = input_line_pointer;
9354 input_line_pointer = imm_start;
9355
9356 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9357 if (gotfree_input_line)
9358 input_line_pointer = gotfree_input_line;
9359
9360 exp_seg = expression (exp);
9361
9362 SKIP_WHITESPACE ();
9363
9364 /* Handle vector operations. */
9365 if (*input_line_pointer == '{')
9366 {
9367 input_line_pointer = check_VecOperations (input_line_pointer,
9368 NULL);
9369 if (input_line_pointer == NULL)
9370 return 0;
9371 }
9372
9373 if (*input_line_pointer)
9374 as_bad (_("junk `%s' after expression"), input_line_pointer);
9375
9376 input_line_pointer = save_input_line_pointer;
9377 if (gotfree_input_line)
9378 {
9379 free (gotfree_input_line);
9380
9381 if (exp->X_op == O_constant || exp->X_op == O_register)
9382 exp->X_op = O_illegal;
9383 }
9384
9385 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
9386 }
9387
9388 static int
9389 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9390 i386_operand_type types, const char *imm_start)
9391 {
9392 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
9393 {
9394 if (imm_start)
9395 as_bad (_("missing or invalid immediate expression `%s'"),
9396 imm_start);
9397 return 0;
9398 }
9399 else if (exp->X_op == O_constant)
9400 {
9401 /* Size it properly later. */
9402 i.types[this_operand].bitfield.imm64 = 1;
9403 /* If not 64bit, sign extend val. */
9404 if (flag_code != CODE_64BIT
9405 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
9406 exp->X_add_number
9407 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
9408 }
9409 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9410 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
9411 && exp_seg != absolute_section
9412 && exp_seg != text_section
9413 && exp_seg != data_section
9414 && exp_seg != bss_section
9415 && exp_seg != undefined_section
9416 && !bfd_is_com_section (exp_seg))
9417 {
9418 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9419 return 0;
9420 }
9421 #endif
9422 else if (!intel_syntax && exp_seg == reg_section)
9423 {
9424 if (imm_start)
9425 as_bad (_("illegal immediate register operand %s"), imm_start);
9426 return 0;
9427 }
9428 else
9429 {
9430 /* This is an address. The size of the address will be
9431 determined later, depending on destination register,
9432 suffix, or the default for the section. */
9433 i.types[this_operand].bitfield.imm8 = 1;
9434 i.types[this_operand].bitfield.imm16 = 1;
9435 i.types[this_operand].bitfield.imm32 = 1;
9436 i.types[this_operand].bitfield.imm32s = 1;
9437 i.types[this_operand].bitfield.imm64 = 1;
9438 i.types[this_operand] = operand_type_and (i.types[this_operand],
9439 types);
9440 }
9441
9442 return 1;
9443 }
9444
9445 static char *
9446 i386_scale (char *scale)
9447 {
9448 offsetT val;
9449 char *save = input_line_pointer;
9450
9451 input_line_pointer = scale;
9452 val = get_absolute_expression ();
9453
9454 switch (val)
9455 {
9456 case 1:
9457 i.log2_scale_factor = 0;
9458 break;
9459 case 2:
9460 i.log2_scale_factor = 1;
9461 break;
9462 case 4:
9463 i.log2_scale_factor = 2;
9464 break;
9465 case 8:
9466 i.log2_scale_factor = 3;
9467 break;
9468 default:
9469 {
9470 char sep = *input_line_pointer;
9471
9472 *input_line_pointer = '\0';
9473 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
9474 scale);
9475 *input_line_pointer = sep;
9476 input_line_pointer = save;
9477 return NULL;
9478 }
9479 }
9480 if (i.log2_scale_factor != 0 && i.index_reg == 0)
9481 {
9482 as_warn (_("scale factor of %d without an index register"),
9483 1 << i.log2_scale_factor);
9484 i.log2_scale_factor = 0;
9485 }
9486 scale = input_line_pointer;
9487 input_line_pointer = save;
9488 return scale;
9489 }
9490
9491 static int
9492 i386_displacement (char *disp_start, char *disp_end)
9493 {
9494 expressionS *exp;
9495 segT exp_seg = 0;
9496 char *save_input_line_pointer;
9497 char *gotfree_input_line;
9498 int override;
9499 i386_operand_type bigdisp, types = anydisp;
9500 int ret;
9501
9502 if (i.disp_operands == MAX_MEMORY_OPERANDS)
9503 {
9504 as_bad (_("at most %d displacement operands are allowed"),
9505 MAX_MEMORY_OPERANDS);
9506 return 0;
9507 }
9508
9509 operand_type_set (&bigdisp, 0);
9510 if ((i.types[this_operand].bitfield.jumpabsolute)
9511 || (!current_templates->start->opcode_modifier.jump
9512 && !current_templates->start->opcode_modifier.jumpdword))
9513 {
9514 bigdisp.bitfield.disp32 = 1;
9515 override = (i.prefix[ADDR_PREFIX] != 0);
9516 if (flag_code == CODE_64BIT)
9517 {
9518 if (!override)
9519 {
9520 bigdisp.bitfield.disp32s = 1;
9521 bigdisp.bitfield.disp64 = 1;
9522 }
9523 }
9524 else if ((flag_code == CODE_16BIT) ^ override)
9525 {
9526 bigdisp.bitfield.disp32 = 0;
9527 bigdisp.bitfield.disp16 = 1;
9528 }
9529 }
9530 else
9531 {
9532 /* For PC-relative branches, the width of the displacement
9533 is dependent upon data size, not address size. */
9534 override = (i.prefix[DATA_PREFIX] != 0);
9535 if (flag_code == CODE_64BIT)
9536 {
9537 if (override || i.suffix == WORD_MNEM_SUFFIX)
9538 bigdisp.bitfield.disp16 = 1;
9539 else
9540 {
9541 bigdisp.bitfield.disp32 = 1;
9542 bigdisp.bitfield.disp32s = 1;
9543 }
9544 }
9545 else
9546 {
9547 if (!override)
9548 override = (i.suffix == (flag_code != CODE_16BIT
9549 ? WORD_MNEM_SUFFIX
9550 : LONG_MNEM_SUFFIX));
9551 bigdisp.bitfield.disp32 = 1;
9552 if ((flag_code == CODE_16BIT) ^ override)
9553 {
9554 bigdisp.bitfield.disp32 = 0;
9555 bigdisp.bitfield.disp16 = 1;
9556 }
9557 }
9558 }
9559 i.types[this_operand] = operand_type_or (i.types[this_operand],
9560 bigdisp);
9561
9562 exp = &disp_expressions[i.disp_operands];
9563 i.op[this_operand].disps = exp;
9564 i.disp_operands++;
9565 save_input_line_pointer = input_line_pointer;
9566 input_line_pointer = disp_start;
9567 END_STRING_AND_SAVE (disp_end);
9568
9569 #ifndef GCC_ASM_O_HACK
9570 #define GCC_ASM_O_HACK 0
9571 #endif
9572 #if GCC_ASM_O_HACK
9573 END_STRING_AND_SAVE (disp_end + 1);
9574 if (i.types[this_operand].bitfield.baseIndex
9575 && displacement_string_end[-1] == '+')
9576 {
9577 /* This hack is to avoid a warning when using the "o"
9578 constraint within gcc asm statements.
9579 For instance:
9580
9581 #define _set_tssldt_desc(n,addr,limit,type) \
9582 __asm__ __volatile__ ( \
9583 "movw %w2,%0\n\t" \
9584 "movw %w1,2+%0\n\t" \
9585 "rorl $16,%1\n\t" \
9586 "movb %b1,4+%0\n\t" \
9587 "movb %4,5+%0\n\t" \
9588 "movb $0,6+%0\n\t" \
9589 "movb %h1,7+%0\n\t" \
9590 "rorl $16,%1" \
9591 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
9592
9593 This works great except that the output assembler ends
9594 up looking a bit weird if it turns out that there is
9595 no offset. You end up producing code that looks like:
9596
9597 #APP
9598 movw $235,(%eax)
9599 movw %dx,2+(%eax)
9600 rorl $16,%edx
9601 movb %dl,4+(%eax)
9602 movb $137,5+(%eax)
9603 movb $0,6+(%eax)
9604 movb %dh,7+(%eax)
9605 rorl $16,%edx
9606 #NO_APP
9607
9608 So here we provide the missing zero. */
9609
9610 *displacement_string_end = '0';
9611 }
9612 #endif
9613 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9614 if (gotfree_input_line)
9615 input_line_pointer = gotfree_input_line;
9616
9617 exp_seg = expression (exp);
9618
9619 SKIP_WHITESPACE ();
9620 if (*input_line_pointer)
9621 as_bad (_("junk `%s' after expression"), input_line_pointer);
9622 #if GCC_ASM_O_HACK
9623 RESTORE_END_STRING (disp_end + 1);
9624 #endif
9625 input_line_pointer = save_input_line_pointer;
9626 if (gotfree_input_line)
9627 {
9628 free (gotfree_input_line);
9629
9630 if (exp->X_op == O_constant || exp->X_op == O_register)
9631 exp->X_op = O_illegal;
9632 }
9633
9634 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
9635
9636 RESTORE_END_STRING (disp_end);
9637
9638 return ret;
9639 }
9640
9641 static int
9642 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9643 i386_operand_type types, const char *disp_start)
9644 {
9645 i386_operand_type bigdisp;
9646 int ret = 1;
9647
9648 /* We do this to make sure that the section symbol is in
9649 the symbol table. We will ultimately change the relocation
9650 to be relative to the beginning of the section. */
9651 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
9652 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
9653 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9654 {
9655 if (exp->X_op != O_symbol)
9656 goto inv_disp;
9657
9658 if (S_IS_LOCAL (exp->X_add_symbol)
9659 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
9660 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
9661 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
9662 exp->X_op = O_subtract;
9663 exp->X_op_symbol = GOT_symbol;
9664 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
9665 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
9666 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9667 i.reloc[this_operand] = BFD_RELOC_64;
9668 else
9669 i.reloc[this_operand] = BFD_RELOC_32;
9670 }
9671
9672 else if (exp->X_op == O_absent
9673 || exp->X_op == O_illegal
9674 || exp->X_op == O_big)
9675 {
9676 inv_disp:
9677 as_bad (_("missing or invalid displacement expression `%s'"),
9678 disp_start);
9679 ret = 0;
9680 }
9681
9682 else if (flag_code == CODE_64BIT
9683 && !i.prefix[ADDR_PREFIX]
9684 && exp->X_op == O_constant)
9685 {
9686 /* Since displacement is signed extended to 64bit, don't allow
9687 disp32 and turn off disp32s if they are out of range. */
9688 i.types[this_operand].bitfield.disp32 = 0;
9689 if (!fits_in_signed_long (exp->X_add_number))
9690 {
9691 i.types[this_operand].bitfield.disp32s = 0;
9692 if (i.types[this_operand].bitfield.baseindex)
9693 {
9694 as_bad (_("0x%lx out range of signed 32bit displacement"),
9695 (long) exp->X_add_number);
9696 ret = 0;
9697 }
9698 }
9699 }
9700
9701 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9702 else if (exp->X_op != O_constant
9703 && OUTPUT_FLAVOR == bfd_target_aout_flavour
9704 && exp_seg != absolute_section
9705 && exp_seg != text_section
9706 && exp_seg != data_section
9707 && exp_seg != bss_section
9708 && exp_seg != undefined_section
9709 && !bfd_is_com_section (exp_seg))
9710 {
9711 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9712 ret = 0;
9713 }
9714 #endif
9715
9716 /* Check if this is a displacement only operand. */
9717 bigdisp = i.types[this_operand];
9718 bigdisp.bitfield.disp8 = 0;
9719 bigdisp.bitfield.disp16 = 0;
9720 bigdisp.bitfield.disp32 = 0;
9721 bigdisp.bitfield.disp32s = 0;
9722 bigdisp.bitfield.disp64 = 0;
9723 if (operand_type_all_zero (&bigdisp))
9724 i.types[this_operand] = operand_type_and (i.types[this_operand],
9725 types);
9726
9727 return ret;
9728 }
9729
9730 /* Return the active addressing mode, taking address override and
9731 registers forming the address into consideration. Update the
9732 address override prefix if necessary. */
9733
9734 static enum flag_code
9735 i386_addressing_mode (void)
9736 {
9737 enum flag_code addr_mode;
9738
9739 if (i.prefix[ADDR_PREFIX])
9740 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
9741 else
9742 {
9743 addr_mode = flag_code;
9744
9745 #if INFER_ADDR_PREFIX
9746 if (i.mem_operands == 0)
9747 {
9748 /* Infer address prefix from the first memory operand. */
9749 const reg_entry *addr_reg = i.base_reg;
9750
9751 if (addr_reg == NULL)
9752 addr_reg = i.index_reg;
9753
9754 if (addr_reg)
9755 {
9756 if (addr_reg->reg_type.bitfield.dword)
9757 addr_mode = CODE_32BIT;
9758 else if (flag_code != CODE_64BIT
9759 && addr_reg->reg_type.bitfield.word)
9760 addr_mode = CODE_16BIT;
9761
9762 if (addr_mode != flag_code)
9763 {
9764 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
9765 i.prefixes += 1;
9766 /* Change the size of any displacement too. At most one
9767 of Disp16 or Disp32 is set.
9768 FIXME. There doesn't seem to be any real need for
9769 separate Disp16 and Disp32 flags. The same goes for
9770 Imm16 and Imm32. Removing them would probably clean
9771 up the code quite a lot. */
9772 if (flag_code != CODE_64BIT
9773 && (i.types[this_operand].bitfield.disp16
9774 || i.types[this_operand].bitfield.disp32))
9775 i.types[this_operand]
9776 = operand_type_xor (i.types[this_operand], disp16_32);
9777 }
9778 }
9779 }
9780 #endif
9781 }
9782
9783 return addr_mode;
9784 }
9785
9786 /* Make sure the memory operand we've been dealt is valid.
9787 Return 1 on success, 0 on a failure. */
9788
9789 static int
9790 i386_index_check (const char *operand_string)
9791 {
9792 const char *kind = "base/index";
9793 enum flag_code addr_mode = i386_addressing_mode ();
9794
9795 if (current_templates->start->opcode_modifier.isstring
9796 && !current_templates->start->cpu_flags.bitfield.cpupadlock
9797 && (current_templates->end[-1].opcode_modifier.isstring
9798 || i.mem_operands))
9799 {
9800 /* Memory operands of string insns are special in that they only allow
9801 a single register (rDI, rSI, or rBX) as their memory address. */
9802 const reg_entry *expected_reg;
9803 static const char *di_si[][2] =
9804 {
9805 { "esi", "edi" },
9806 { "si", "di" },
9807 { "rsi", "rdi" }
9808 };
9809 static const char *bx[] = { "ebx", "bx", "rbx" };
9810
9811 kind = "string address";
9812
9813 if (current_templates->start->opcode_modifier.repprefixok)
9814 {
9815 i386_operand_type type = current_templates->end[-1].operand_types[0];
9816
9817 if (!type.bitfield.baseindex
9818 || ((!i.mem_operands != !intel_syntax)
9819 && current_templates->end[-1].operand_types[1]
9820 .bitfield.baseindex))
9821 type = current_templates->end[-1].operand_types[1];
9822 expected_reg = hash_find (reg_hash,
9823 di_si[addr_mode][type.bitfield.esseg]);
9824
9825 }
9826 else
9827 expected_reg = hash_find (reg_hash, bx[addr_mode]);
9828
9829 if (i.base_reg != expected_reg
9830 || i.index_reg
9831 || operand_type_check (i.types[this_operand], disp))
9832 {
9833 /* The second memory operand must have the same size as
9834 the first one. */
9835 if (i.mem_operands
9836 && i.base_reg
9837 && !((addr_mode == CODE_64BIT
9838 && i.base_reg->reg_type.bitfield.qword)
9839 || (addr_mode == CODE_32BIT
9840 ? i.base_reg->reg_type.bitfield.dword
9841 : i.base_reg->reg_type.bitfield.word)))
9842 goto bad_address;
9843
9844 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
9845 operand_string,
9846 intel_syntax ? '[' : '(',
9847 register_prefix,
9848 expected_reg->reg_name,
9849 intel_syntax ? ']' : ')');
9850 return 1;
9851 }
9852 else
9853 return 1;
9854
9855 bad_address:
9856 as_bad (_("`%s' is not a valid %s expression"),
9857 operand_string, kind);
9858 return 0;
9859 }
9860 else
9861 {
9862 if (addr_mode != CODE_16BIT)
9863 {
9864 /* 32-bit/64-bit checks. */
9865 if ((i.base_reg
9866 && ((addr_mode == CODE_64BIT
9867 ? !i.base_reg->reg_type.bitfield.qword
9868 : !i.base_reg->reg_type.bitfield.dword)
9869 || (i.index_reg && i.base_reg->reg_num == RegIP)
9870 || i.base_reg->reg_num == RegIZ))
9871 || (i.index_reg
9872 && !i.index_reg->reg_type.bitfield.xmmword
9873 && !i.index_reg->reg_type.bitfield.ymmword
9874 && !i.index_reg->reg_type.bitfield.zmmword
9875 && ((addr_mode == CODE_64BIT
9876 ? !i.index_reg->reg_type.bitfield.qword
9877 : !i.index_reg->reg_type.bitfield.dword)
9878 || !i.index_reg->reg_type.bitfield.baseindex)))
9879 goto bad_address;
9880
9881 /* bndmk, bndldx, and bndstx have special restrictions. */
9882 if (current_templates->start->base_opcode == 0xf30f1b
9883 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
9884 {
9885 /* They cannot use RIP-relative addressing. */
9886 if (i.base_reg && i.base_reg->reg_num == RegIP)
9887 {
9888 as_bad (_("`%s' cannot be used here"), operand_string);
9889 return 0;
9890 }
9891
9892 /* bndldx and bndstx ignore their scale factor. */
9893 if (current_templates->start->base_opcode != 0xf30f1b
9894 && i.log2_scale_factor)
9895 as_warn (_("register scaling is being ignored here"));
9896 }
9897 }
9898 else
9899 {
9900 /* 16-bit checks. */
9901 if ((i.base_reg
9902 && (!i.base_reg->reg_type.bitfield.word
9903 || !i.base_reg->reg_type.bitfield.baseindex))
9904 || (i.index_reg
9905 && (!i.index_reg->reg_type.bitfield.word
9906 || !i.index_reg->reg_type.bitfield.baseindex
9907 || !(i.base_reg
9908 && i.base_reg->reg_num < 6
9909 && i.index_reg->reg_num >= 6
9910 && i.log2_scale_factor == 0))))
9911 goto bad_address;
9912 }
9913 }
9914 return 1;
9915 }
9916
9917 /* Handle vector immediates. */
9918
9919 static int
9920 RC_SAE_immediate (const char *imm_start)
9921 {
9922 unsigned int match_found, j;
9923 const char *pstr = imm_start;
9924 expressionS *exp;
9925
9926 if (*pstr != '{')
9927 return 0;
9928
9929 pstr++;
9930 match_found = 0;
9931 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
9932 {
9933 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
9934 {
9935 if (!i.rounding)
9936 {
9937 rc_op.type = RC_NamesTable[j].type;
9938 rc_op.operand = this_operand;
9939 i.rounding = &rc_op;
9940 }
9941 else
9942 {
9943 as_bad (_("duplicated `%s'"), imm_start);
9944 return 0;
9945 }
9946 pstr += RC_NamesTable[j].len;
9947 match_found = 1;
9948 break;
9949 }
9950 }
9951 if (!match_found)
9952 return 0;
9953
9954 if (*pstr++ != '}')
9955 {
9956 as_bad (_("Missing '}': '%s'"), imm_start);
9957 return 0;
9958 }
9959 /* RC/SAE immediate string should contain nothing more. */;
9960 if (*pstr != 0)
9961 {
9962 as_bad (_("Junk after '}': '%s'"), imm_start);
9963 return 0;
9964 }
9965
9966 exp = &im_expressions[i.imm_operands++];
9967 i.op[this_operand].imms = exp;
9968
9969 exp->X_op = O_constant;
9970 exp->X_add_number = 0;
9971 exp->X_add_symbol = (symbolS *) 0;
9972 exp->X_op_symbol = (symbolS *) 0;
9973
9974 i.types[this_operand].bitfield.imm8 = 1;
9975 return 1;
9976 }
9977
9978 /* Only string instructions can have a second memory operand, so
9979 reduce current_templates to just those if it contains any. */
9980 static int
9981 maybe_adjust_templates (void)
9982 {
9983 const insn_template *t;
9984
9985 gas_assert (i.mem_operands == 1);
9986
9987 for (t = current_templates->start; t < current_templates->end; ++t)
9988 if (t->opcode_modifier.isstring)
9989 break;
9990
9991 if (t < current_templates->end)
9992 {
9993 static templates aux_templates;
9994 bfd_boolean recheck;
9995
9996 aux_templates.start = t;
9997 for (; t < current_templates->end; ++t)
9998 if (!t->opcode_modifier.isstring)
9999 break;
10000 aux_templates.end = t;
10001
10002 /* Determine whether to re-check the first memory operand. */
10003 recheck = (aux_templates.start != current_templates->start
10004 || t != current_templates->end);
10005
10006 current_templates = &aux_templates;
10007
10008 if (recheck)
10009 {
10010 i.mem_operands = 0;
10011 if (i.memop1_string != NULL
10012 && i386_index_check (i.memop1_string) == 0)
10013 return 0;
10014 i.mem_operands = 1;
10015 }
10016 }
10017
10018 return 1;
10019 }
10020
10021 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
10022 on error. */
10023
10024 static int
10025 i386_att_operand (char *operand_string)
10026 {
10027 const reg_entry *r;
10028 char *end_op;
10029 char *op_string = operand_string;
10030
10031 if (is_space_char (*op_string))
10032 ++op_string;
10033
10034 /* We check for an absolute prefix (differentiating,
10035 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
10036 if (*op_string == ABSOLUTE_PREFIX)
10037 {
10038 ++op_string;
10039 if (is_space_char (*op_string))
10040 ++op_string;
10041 i.types[this_operand].bitfield.jumpabsolute = 1;
10042 }
10043
10044 /* Check if operand is a register. */
10045 if ((r = parse_register (op_string, &end_op)) != NULL)
10046 {
10047 i386_operand_type temp;
10048
10049 /* Check for a segment override by searching for ':' after a
10050 segment register. */
10051 op_string = end_op;
10052 if (is_space_char (*op_string))
10053 ++op_string;
10054 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
10055 {
10056 switch (r->reg_num)
10057 {
10058 case 0:
10059 i.seg[i.mem_operands] = &es;
10060 break;
10061 case 1:
10062 i.seg[i.mem_operands] = &cs;
10063 break;
10064 case 2:
10065 i.seg[i.mem_operands] = &ss;
10066 break;
10067 case 3:
10068 i.seg[i.mem_operands] = &ds;
10069 break;
10070 case 4:
10071 i.seg[i.mem_operands] = &fs;
10072 break;
10073 case 5:
10074 i.seg[i.mem_operands] = &gs;
10075 break;
10076 }
10077
10078 /* Skip the ':' and whitespace. */
10079 ++op_string;
10080 if (is_space_char (*op_string))
10081 ++op_string;
10082
10083 if (!is_digit_char (*op_string)
10084 && !is_identifier_char (*op_string)
10085 && *op_string != '('
10086 && *op_string != ABSOLUTE_PREFIX)
10087 {
10088 as_bad (_("bad memory operand `%s'"), op_string);
10089 return 0;
10090 }
10091 /* Handle case of %es:*foo. */
10092 if (*op_string == ABSOLUTE_PREFIX)
10093 {
10094 ++op_string;
10095 if (is_space_char (*op_string))
10096 ++op_string;
10097 i.types[this_operand].bitfield.jumpabsolute = 1;
10098 }
10099 goto do_memory_reference;
10100 }
10101
10102 /* Handle vector operations. */
10103 if (*op_string == '{')
10104 {
10105 op_string = check_VecOperations (op_string, NULL);
10106 if (op_string == NULL)
10107 return 0;
10108 }
10109
10110 if (*op_string)
10111 {
10112 as_bad (_("junk `%s' after register"), op_string);
10113 return 0;
10114 }
10115 temp = r->reg_type;
10116 temp.bitfield.baseindex = 0;
10117 i.types[this_operand] = operand_type_or (i.types[this_operand],
10118 temp);
10119 i.types[this_operand].bitfield.unspecified = 0;
10120 i.op[this_operand].regs = r;
10121 i.reg_operands++;
10122 }
10123 else if (*op_string == REGISTER_PREFIX)
10124 {
10125 as_bad (_("bad register name `%s'"), op_string);
10126 return 0;
10127 }
10128 else if (*op_string == IMMEDIATE_PREFIX)
10129 {
10130 ++op_string;
10131 if (i.types[this_operand].bitfield.jumpabsolute)
10132 {
10133 as_bad (_("immediate operand illegal with absolute jump"));
10134 return 0;
10135 }
10136 if (!i386_immediate (op_string))
10137 return 0;
10138 }
10139 else if (RC_SAE_immediate (operand_string))
10140 {
10141 /* If it is a RC or SAE immediate, do nothing. */
10142 ;
10143 }
10144 else if (is_digit_char (*op_string)
10145 || is_identifier_char (*op_string)
10146 || *op_string == '"'
10147 || *op_string == '(')
10148 {
10149 /* This is a memory reference of some sort. */
10150 char *base_string;
10151
10152 /* Start and end of displacement string expression (if found). */
10153 char *displacement_string_start;
10154 char *displacement_string_end;
10155 char *vop_start;
10156
10157 do_memory_reference:
10158 if (i.mem_operands == 1 && !maybe_adjust_templates ())
10159 return 0;
10160 if ((i.mem_operands == 1
10161 && !current_templates->start->opcode_modifier.isstring)
10162 || i.mem_operands == 2)
10163 {
10164 as_bad (_("too many memory references for `%s'"),
10165 current_templates->start->name);
10166 return 0;
10167 }
10168
10169 /* Check for base index form. We detect the base index form by
10170 looking for an ')' at the end of the operand, searching
10171 for the '(' matching it, and finding a REGISTER_PREFIX or ','
10172 after the '('. */
10173 base_string = op_string + strlen (op_string);
10174
10175 /* Handle vector operations. */
10176 vop_start = strchr (op_string, '{');
10177 if (vop_start && vop_start < base_string)
10178 {
10179 if (check_VecOperations (vop_start, base_string) == NULL)
10180 return 0;
10181 base_string = vop_start;
10182 }
10183
10184 --base_string;
10185 if (is_space_char (*base_string))
10186 --base_string;
10187
10188 /* If we only have a displacement, set-up for it to be parsed later. */
10189 displacement_string_start = op_string;
10190 displacement_string_end = base_string + 1;
10191
10192 if (*base_string == ')')
10193 {
10194 char *temp_string;
10195 unsigned int parens_balanced = 1;
10196 /* We've already checked that the number of left & right ()'s are
10197 equal, so this loop will not be infinite. */
10198 do
10199 {
10200 base_string--;
10201 if (*base_string == ')')
10202 parens_balanced++;
10203 if (*base_string == '(')
10204 parens_balanced--;
10205 }
10206 while (parens_balanced);
10207
10208 temp_string = base_string;
10209
10210 /* Skip past '(' and whitespace. */
10211 ++base_string;
10212 if (is_space_char (*base_string))
10213 ++base_string;
10214
10215 if (*base_string == ','
10216 || ((i.base_reg = parse_register (base_string, &end_op))
10217 != NULL))
10218 {
10219 displacement_string_end = temp_string;
10220
10221 i.types[this_operand].bitfield.baseindex = 1;
10222
10223 if (i.base_reg)
10224 {
10225 base_string = end_op;
10226 if (is_space_char (*base_string))
10227 ++base_string;
10228 }
10229
10230 /* There may be an index reg or scale factor here. */
10231 if (*base_string == ',')
10232 {
10233 ++base_string;
10234 if (is_space_char (*base_string))
10235 ++base_string;
10236
10237 if ((i.index_reg = parse_register (base_string, &end_op))
10238 != NULL)
10239 {
10240 base_string = end_op;
10241 if (is_space_char (*base_string))
10242 ++base_string;
10243 if (*base_string == ',')
10244 {
10245 ++base_string;
10246 if (is_space_char (*base_string))
10247 ++base_string;
10248 }
10249 else if (*base_string != ')')
10250 {
10251 as_bad (_("expecting `,' or `)' "
10252 "after index register in `%s'"),
10253 operand_string);
10254 return 0;
10255 }
10256 }
10257 else if (*base_string == REGISTER_PREFIX)
10258 {
10259 end_op = strchr (base_string, ',');
10260 if (end_op)
10261 *end_op = '\0';
10262 as_bad (_("bad register name `%s'"), base_string);
10263 return 0;
10264 }
10265
10266 /* Check for scale factor. */
10267 if (*base_string != ')')
10268 {
10269 char *end_scale = i386_scale (base_string);
10270
10271 if (!end_scale)
10272 return 0;
10273
10274 base_string = end_scale;
10275 if (is_space_char (*base_string))
10276 ++base_string;
10277 if (*base_string != ')')
10278 {
10279 as_bad (_("expecting `)' "
10280 "after scale factor in `%s'"),
10281 operand_string);
10282 return 0;
10283 }
10284 }
10285 else if (!i.index_reg)
10286 {
10287 as_bad (_("expecting index register or scale factor "
10288 "after `,'; got '%c'"),
10289 *base_string);
10290 return 0;
10291 }
10292 }
10293 else if (*base_string != ')')
10294 {
10295 as_bad (_("expecting `,' or `)' "
10296 "after base register in `%s'"),
10297 operand_string);
10298 return 0;
10299 }
10300 }
10301 else if (*base_string == REGISTER_PREFIX)
10302 {
10303 end_op = strchr (base_string, ',');
10304 if (end_op)
10305 *end_op = '\0';
10306 as_bad (_("bad register name `%s'"), base_string);
10307 return 0;
10308 }
10309 }
10310
10311 /* If there's an expression beginning the operand, parse it,
10312 assuming displacement_string_start and
10313 displacement_string_end are meaningful. */
10314 if (displacement_string_start != displacement_string_end)
10315 {
10316 if (!i386_displacement (displacement_string_start,
10317 displacement_string_end))
10318 return 0;
10319 }
10320
10321 /* Special case for (%dx) while doing input/output op. */
10322 if (i.base_reg
10323 && i.base_reg->reg_type.bitfield.inoutportreg
10324 && i.index_reg == 0
10325 && i.log2_scale_factor == 0
10326 && i.seg[i.mem_operands] == 0
10327 && !operand_type_check (i.types[this_operand], disp))
10328 {
10329 i.types[this_operand] = i.base_reg->reg_type;
10330 return 1;
10331 }
10332
10333 if (i386_index_check (operand_string) == 0)
10334 return 0;
10335 i.flags[this_operand] |= Operand_Mem;
10336 if (i.mem_operands == 0)
10337 i.memop1_string = xstrdup (operand_string);
10338 i.mem_operands++;
10339 }
10340 else
10341 {
10342 /* It's not a memory operand; argh! */
10343 as_bad (_("invalid char %s beginning operand %d `%s'"),
10344 output_invalid (*op_string),
10345 this_operand + 1,
10346 op_string);
10347 return 0;
10348 }
10349 return 1; /* Normal return. */
10350 }
10351 \f
10352 /* Calculate the maximum variable size (i.e., excluding fr_fix)
10353 that an rs_machine_dependent frag may reach. */
10354
10355 unsigned int
10356 i386_frag_max_var (fragS *frag)
10357 {
10358 /* The only relaxable frags are for jumps.
10359 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
10360 gas_assert (frag->fr_type == rs_machine_dependent);
10361 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
10362 }
10363
10364 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10365 static int
10366 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
10367 {
10368 /* STT_GNU_IFUNC symbol must go through PLT. */
10369 if ((symbol_get_bfdsym (fr_symbol)->flags
10370 & BSF_GNU_INDIRECT_FUNCTION) != 0)
10371 return 0;
10372
10373 if (!S_IS_EXTERNAL (fr_symbol))
10374 /* Symbol may be weak or local. */
10375 return !S_IS_WEAK (fr_symbol);
10376
10377 /* Global symbols with non-default visibility can't be preempted. */
10378 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
10379 return 1;
10380
10381 if (fr_var != NO_RELOC)
10382 switch ((enum bfd_reloc_code_real) fr_var)
10383 {
10384 case BFD_RELOC_386_PLT32:
10385 case BFD_RELOC_X86_64_PLT32:
10386 /* Symbol with PLT relocation may be preempted. */
10387 return 0;
10388 default:
10389 abort ();
10390 }
10391
10392 /* Global symbols with default visibility in a shared library may be
10393 preempted by another definition. */
10394 return !shared;
10395 }
10396 #endif
10397
10398 /* md_estimate_size_before_relax()
10399
10400 Called just before relax() for rs_machine_dependent frags. The x86
10401 assembler uses these frags to handle variable size jump
10402 instructions.
10403
10404 Any symbol that is now undefined will not become defined.
10405 Return the correct fr_subtype in the frag.
10406 Return the initial "guess for variable size of frag" to caller.
10407 The guess is actually the growth beyond the fixed part. Whatever
10408 we do to grow the fixed or variable part contributes to our
10409 returned value. */
10410
10411 int
10412 md_estimate_size_before_relax (fragS *fragP, segT segment)
10413 {
10414 /* We've already got fragP->fr_subtype right; all we have to do is
10415 check for un-relaxable symbols. On an ELF system, we can't relax
10416 an externally visible symbol, because it may be overridden by a
10417 shared library. */
10418 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
10419 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10420 || (IS_ELF
10421 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
10422 fragP->fr_var))
10423 #endif
10424 #if defined (OBJ_COFF) && defined (TE_PE)
10425 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
10426 && S_IS_WEAK (fragP->fr_symbol))
10427 #endif
10428 )
10429 {
10430 /* Symbol is undefined in this segment, or we need to keep a
10431 reloc so that weak symbols can be overridden. */
10432 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
10433 enum bfd_reloc_code_real reloc_type;
10434 unsigned char *opcode;
10435 int old_fr_fix;
10436
10437 if (fragP->fr_var != NO_RELOC)
10438 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
10439 else if (size == 2)
10440 reloc_type = BFD_RELOC_16_PCREL;
10441 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10442 else if (need_plt32_p (fragP->fr_symbol))
10443 reloc_type = BFD_RELOC_X86_64_PLT32;
10444 #endif
10445 else
10446 reloc_type = BFD_RELOC_32_PCREL;
10447
10448 old_fr_fix = fragP->fr_fix;
10449 opcode = (unsigned char *) fragP->fr_opcode;
10450
10451 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
10452 {
10453 case UNCOND_JUMP:
10454 /* Make jmp (0xeb) a (d)word displacement jump. */
10455 opcode[0] = 0xe9;
10456 fragP->fr_fix += size;
10457 fix_new (fragP, old_fr_fix, size,
10458 fragP->fr_symbol,
10459 fragP->fr_offset, 1,
10460 reloc_type);
10461 break;
10462
10463 case COND_JUMP86:
10464 if (size == 2
10465 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
10466 {
10467 /* Negate the condition, and branch past an
10468 unconditional jump. */
10469 opcode[0] ^= 1;
10470 opcode[1] = 3;
10471 /* Insert an unconditional jump. */
10472 opcode[2] = 0xe9;
10473 /* We added two extra opcode bytes, and have a two byte
10474 offset. */
10475 fragP->fr_fix += 2 + 2;
10476 fix_new (fragP, old_fr_fix + 2, 2,
10477 fragP->fr_symbol,
10478 fragP->fr_offset, 1,
10479 reloc_type);
10480 break;
10481 }
10482 /* Fall through. */
10483
10484 case COND_JUMP:
10485 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
10486 {
10487 fixS *fixP;
10488
10489 fragP->fr_fix += 1;
10490 fixP = fix_new (fragP, old_fr_fix, 1,
10491 fragP->fr_symbol,
10492 fragP->fr_offset, 1,
10493 BFD_RELOC_8_PCREL);
10494 fixP->fx_signed = 1;
10495 break;
10496 }
10497
10498 /* This changes the byte-displacement jump 0x7N
10499 to the (d)word-displacement jump 0x0f,0x8N. */
10500 opcode[1] = opcode[0] + 0x10;
10501 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10502 /* We've added an opcode byte. */
10503 fragP->fr_fix += 1 + size;
10504 fix_new (fragP, old_fr_fix + 1, size,
10505 fragP->fr_symbol,
10506 fragP->fr_offset, 1,
10507 reloc_type);
10508 break;
10509
10510 default:
10511 BAD_CASE (fragP->fr_subtype);
10512 break;
10513 }
10514 frag_wane (fragP);
10515 return fragP->fr_fix - old_fr_fix;
10516 }
10517
10518 /* Guess size depending on current relax state. Initially the relax
10519 state will correspond to a short jump and we return 1, because
10520 the variable part of the frag (the branch offset) is one byte
10521 long. However, we can relax a section more than once and in that
10522 case we must either set fr_subtype back to the unrelaxed state,
10523 or return the value for the appropriate branch. */
10524 return md_relax_table[fragP->fr_subtype].rlx_length;
10525 }
10526
10527 /* Called after relax() is finished.
10528
10529 In: Address of frag.
10530 fr_type == rs_machine_dependent.
10531 fr_subtype is what the address relaxed to.
10532
10533 Out: Any fixSs and constants are set up.
10534 Caller will turn frag into a ".space 0". */
10535
10536 void
10537 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
10538 fragS *fragP)
10539 {
10540 unsigned char *opcode;
10541 unsigned char *where_to_put_displacement = NULL;
10542 offsetT target_address;
10543 offsetT opcode_address;
10544 unsigned int extension = 0;
10545 offsetT displacement_from_opcode_start;
10546
10547 opcode = (unsigned char *) fragP->fr_opcode;
10548
10549 /* Address we want to reach in file space. */
10550 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
10551
10552 /* Address opcode resides at in file space. */
10553 opcode_address = fragP->fr_address + fragP->fr_fix;
10554
10555 /* Displacement from opcode start to fill into instruction. */
10556 displacement_from_opcode_start = target_address - opcode_address;
10557
10558 if ((fragP->fr_subtype & BIG) == 0)
10559 {
10560 /* Don't have to change opcode. */
10561 extension = 1; /* 1 opcode + 1 displacement */
10562 where_to_put_displacement = &opcode[1];
10563 }
10564 else
10565 {
10566 if (no_cond_jump_promotion
10567 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
10568 as_warn_where (fragP->fr_file, fragP->fr_line,
10569 _("long jump required"));
10570
10571 switch (fragP->fr_subtype)
10572 {
10573 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
10574 extension = 4; /* 1 opcode + 4 displacement */
10575 opcode[0] = 0xe9;
10576 where_to_put_displacement = &opcode[1];
10577 break;
10578
10579 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
10580 extension = 2; /* 1 opcode + 2 displacement */
10581 opcode[0] = 0xe9;
10582 where_to_put_displacement = &opcode[1];
10583 break;
10584
10585 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
10586 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
10587 extension = 5; /* 2 opcode + 4 displacement */
10588 opcode[1] = opcode[0] + 0x10;
10589 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10590 where_to_put_displacement = &opcode[2];
10591 break;
10592
10593 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
10594 extension = 3; /* 2 opcode + 2 displacement */
10595 opcode[1] = opcode[0] + 0x10;
10596 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10597 where_to_put_displacement = &opcode[2];
10598 break;
10599
10600 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
10601 extension = 4;
10602 opcode[0] ^= 1;
10603 opcode[1] = 3;
10604 opcode[2] = 0xe9;
10605 where_to_put_displacement = &opcode[3];
10606 break;
10607
10608 default:
10609 BAD_CASE (fragP->fr_subtype);
10610 break;
10611 }
10612 }
10613
10614 /* If size if less then four we are sure that the operand fits,
10615 but if it's 4, then it could be that the displacement is larger
10616 then -/+ 2GB. */
10617 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
10618 && object_64bit
10619 && ((addressT) (displacement_from_opcode_start - extension
10620 + ((addressT) 1 << 31))
10621 > (((addressT) 2 << 31) - 1)))
10622 {
10623 as_bad_where (fragP->fr_file, fragP->fr_line,
10624 _("jump target out of range"));
10625 /* Make us emit 0. */
10626 displacement_from_opcode_start = extension;
10627 }
10628 /* Now put displacement after opcode. */
10629 md_number_to_chars ((char *) where_to_put_displacement,
10630 (valueT) (displacement_from_opcode_start - extension),
10631 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
10632 fragP->fr_fix += extension;
10633 }
10634 \f
10635 /* Apply a fixup (fixP) to segment data, once it has been determined
10636 by our caller that we have all the info we need to fix it up.
10637
10638 Parameter valP is the pointer to the value of the bits.
10639
10640 On the 386, immediates, displacements, and data pointers are all in
10641 the same (little-endian) format, so we don't need to care about which
10642 we are handling. */
10643
10644 void
10645 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
10646 {
10647 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
10648 valueT value = *valP;
10649
10650 #if !defined (TE_Mach)
10651 if (fixP->fx_pcrel)
10652 {
10653 switch (fixP->fx_r_type)
10654 {
10655 default:
10656 break;
10657
10658 case BFD_RELOC_64:
10659 fixP->fx_r_type = BFD_RELOC_64_PCREL;
10660 break;
10661 case BFD_RELOC_32:
10662 case BFD_RELOC_X86_64_32S:
10663 fixP->fx_r_type = BFD_RELOC_32_PCREL;
10664 break;
10665 case BFD_RELOC_16:
10666 fixP->fx_r_type = BFD_RELOC_16_PCREL;
10667 break;
10668 case BFD_RELOC_8:
10669 fixP->fx_r_type = BFD_RELOC_8_PCREL;
10670 break;
10671 }
10672 }
10673
10674 if (fixP->fx_addsy != NULL
10675 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
10676 || fixP->fx_r_type == BFD_RELOC_64_PCREL
10677 || fixP->fx_r_type == BFD_RELOC_16_PCREL
10678 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
10679 && !use_rela_relocations)
10680 {
10681 /* This is a hack. There should be a better way to handle this.
10682 This covers for the fact that bfd_install_relocation will
10683 subtract the current location (for partial_inplace, PC relative
10684 relocations); see more below. */
10685 #ifndef OBJ_AOUT
10686 if (IS_ELF
10687 #ifdef TE_PE
10688 || OUTPUT_FLAVOR == bfd_target_coff_flavour
10689 #endif
10690 )
10691 value += fixP->fx_where + fixP->fx_frag->fr_address;
10692 #endif
10693 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10694 if (IS_ELF)
10695 {
10696 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
10697
10698 if ((sym_seg == seg
10699 || (symbol_section_p (fixP->fx_addsy)
10700 && sym_seg != absolute_section))
10701 && !generic_force_reloc (fixP))
10702 {
10703 /* Yes, we add the values in twice. This is because
10704 bfd_install_relocation subtracts them out again. I think
10705 bfd_install_relocation is broken, but I don't dare change
10706 it. FIXME. */
10707 value += fixP->fx_where + fixP->fx_frag->fr_address;
10708 }
10709 }
10710 #endif
10711 #if defined (OBJ_COFF) && defined (TE_PE)
10712 /* For some reason, the PE format does not store a
10713 section address offset for a PC relative symbol. */
10714 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
10715 || S_IS_WEAK (fixP->fx_addsy))
10716 value += md_pcrel_from (fixP);
10717 #endif
10718 }
10719 #if defined (OBJ_COFF) && defined (TE_PE)
10720 if (fixP->fx_addsy != NULL
10721 && S_IS_WEAK (fixP->fx_addsy)
10722 /* PR 16858: Do not modify weak function references. */
10723 && ! fixP->fx_pcrel)
10724 {
10725 #if !defined (TE_PEP)
10726 /* For x86 PE weak function symbols are neither PC-relative
10727 nor do they set S_IS_FUNCTION. So the only reliable way
10728 to detect them is to check the flags of their containing
10729 section. */
10730 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
10731 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
10732 ;
10733 else
10734 #endif
10735 value -= S_GET_VALUE (fixP->fx_addsy);
10736 }
10737 #endif
10738
10739 /* Fix a few things - the dynamic linker expects certain values here,
10740 and we must not disappoint it. */
10741 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10742 if (IS_ELF && fixP->fx_addsy)
10743 switch (fixP->fx_r_type)
10744 {
10745 case BFD_RELOC_386_PLT32:
10746 case BFD_RELOC_X86_64_PLT32:
10747 /* Make the jump instruction point to the address of the operand.
10748 At runtime we merely add the offset to the actual PLT entry.
10749 NB: Subtract the offset size only for jump instructions. */
10750 if (fixP->fx_pcrel)
10751 value = -4;
10752 break;
10753
10754 case BFD_RELOC_386_TLS_GD:
10755 case BFD_RELOC_386_TLS_LDM:
10756 case BFD_RELOC_386_TLS_IE_32:
10757 case BFD_RELOC_386_TLS_IE:
10758 case BFD_RELOC_386_TLS_GOTIE:
10759 case BFD_RELOC_386_TLS_GOTDESC:
10760 case BFD_RELOC_X86_64_TLSGD:
10761 case BFD_RELOC_X86_64_TLSLD:
10762 case BFD_RELOC_X86_64_GOTTPOFF:
10763 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10764 value = 0; /* Fully resolved at runtime. No addend. */
10765 /* Fallthrough */
10766 case BFD_RELOC_386_TLS_LE:
10767 case BFD_RELOC_386_TLS_LDO_32:
10768 case BFD_RELOC_386_TLS_LE_32:
10769 case BFD_RELOC_X86_64_DTPOFF32:
10770 case BFD_RELOC_X86_64_DTPOFF64:
10771 case BFD_RELOC_X86_64_TPOFF32:
10772 case BFD_RELOC_X86_64_TPOFF64:
10773 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10774 break;
10775
10776 case BFD_RELOC_386_TLS_DESC_CALL:
10777 case BFD_RELOC_X86_64_TLSDESC_CALL:
10778 value = 0; /* Fully resolved at runtime. No addend. */
10779 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10780 fixP->fx_done = 0;
10781 return;
10782
10783 case BFD_RELOC_VTABLE_INHERIT:
10784 case BFD_RELOC_VTABLE_ENTRY:
10785 fixP->fx_done = 0;
10786 return;
10787
10788 default:
10789 break;
10790 }
10791 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
10792 *valP = value;
10793 #endif /* !defined (TE_Mach) */
10794
10795 /* Are we finished with this relocation now? */
10796 if (fixP->fx_addsy == NULL)
10797 fixP->fx_done = 1;
10798 #if defined (OBJ_COFF) && defined (TE_PE)
10799 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
10800 {
10801 fixP->fx_done = 0;
10802 /* Remember value for tc_gen_reloc. */
10803 fixP->fx_addnumber = value;
10804 /* Clear out the frag for now. */
10805 value = 0;
10806 }
10807 #endif
10808 else if (use_rela_relocations)
10809 {
10810 fixP->fx_no_overflow = 1;
10811 /* Remember value for tc_gen_reloc. */
10812 fixP->fx_addnumber = value;
10813 value = 0;
10814 }
10815
10816 md_number_to_chars (p, value, fixP->fx_size);
10817 }
10818 \f
10819 const char *
10820 md_atof (int type, char *litP, int *sizeP)
10821 {
10822 /* This outputs the LITTLENUMs in REVERSE order;
10823 in accord with the bigendian 386. */
10824 return ieee_md_atof (type, litP, sizeP, FALSE);
10825 }
10826 \f
10827 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
10828
10829 static char *
10830 output_invalid (int c)
10831 {
10832 if (ISPRINT (c))
10833 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
10834 "'%c'", c);
10835 else
10836 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
10837 "(0x%x)", (unsigned char) c);
10838 return output_invalid_buf;
10839 }
10840
10841 /* REG_STRING starts *before* REGISTER_PREFIX. */
10842
10843 static const reg_entry *
10844 parse_real_register (char *reg_string, char **end_op)
10845 {
10846 char *s = reg_string;
10847 char *p;
10848 char reg_name_given[MAX_REG_NAME_SIZE + 1];
10849 const reg_entry *r;
10850
10851 /* Skip possible REGISTER_PREFIX and possible whitespace. */
10852 if (*s == REGISTER_PREFIX)
10853 ++s;
10854
10855 if (is_space_char (*s))
10856 ++s;
10857
10858 p = reg_name_given;
10859 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
10860 {
10861 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
10862 return (const reg_entry *) NULL;
10863 s++;
10864 }
10865
10866 /* For naked regs, make sure that we are not dealing with an identifier.
10867 This prevents confusing an identifier like `eax_var' with register
10868 `eax'. */
10869 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
10870 return (const reg_entry *) NULL;
10871
10872 *end_op = s;
10873
10874 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
10875
10876 /* Handle floating point regs, allowing spaces in the (i) part. */
10877 if (r == i386_regtab /* %st is first entry of table */)
10878 {
10879 if (!cpu_arch_flags.bitfield.cpu8087
10880 && !cpu_arch_flags.bitfield.cpu287
10881 && !cpu_arch_flags.bitfield.cpu387)
10882 return (const reg_entry *) NULL;
10883
10884 if (is_space_char (*s))
10885 ++s;
10886 if (*s == '(')
10887 {
10888 ++s;
10889 if (is_space_char (*s))
10890 ++s;
10891 if (*s >= '0' && *s <= '7')
10892 {
10893 int fpr = *s - '0';
10894 ++s;
10895 if (is_space_char (*s))
10896 ++s;
10897 if (*s == ')')
10898 {
10899 *end_op = s + 1;
10900 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
10901 know (r);
10902 return r + fpr;
10903 }
10904 }
10905 /* We have "%st(" then garbage. */
10906 return (const reg_entry *) NULL;
10907 }
10908 }
10909
10910 if (r == NULL || allow_pseudo_reg)
10911 return r;
10912
10913 if (operand_type_all_zero (&r->reg_type))
10914 return (const reg_entry *) NULL;
10915
10916 if ((r->reg_type.bitfield.dword
10917 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
10918 || r->reg_type.bitfield.class == RegCR
10919 || r->reg_type.bitfield.class == RegDR
10920 || r->reg_type.bitfield.class == RegTR)
10921 && !cpu_arch_flags.bitfield.cpui386)
10922 return (const reg_entry *) NULL;
10923
10924 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
10925 return (const reg_entry *) NULL;
10926
10927 if (!cpu_arch_flags.bitfield.cpuavx512f)
10928 {
10929 if (r->reg_type.bitfield.zmmword
10930 || r->reg_type.bitfield.class == RegMask)
10931 return (const reg_entry *) NULL;
10932
10933 if (!cpu_arch_flags.bitfield.cpuavx)
10934 {
10935 if (r->reg_type.bitfield.ymmword)
10936 return (const reg_entry *) NULL;
10937
10938 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
10939 return (const reg_entry *) NULL;
10940 }
10941 }
10942
10943 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
10944 return (const reg_entry *) NULL;
10945
10946 /* Don't allow fake index register unless allow_index_reg isn't 0. */
10947 if (!allow_index_reg && r->reg_num == RegIZ)
10948 return (const reg_entry *) NULL;
10949
10950 /* Upper 16 vector registers are only available with VREX in 64bit
10951 mode, and require EVEX encoding. */
10952 if (r->reg_flags & RegVRex)
10953 {
10954 if (!cpu_arch_flags.bitfield.cpuavx512f
10955 || flag_code != CODE_64BIT)
10956 return (const reg_entry *) NULL;
10957
10958 i.vec_encoding = vex_encoding_evex;
10959 }
10960
10961 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
10962 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
10963 && flag_code != CODE_64BIT)
10964 return (const reg_entry *) NULL;
10965
10966 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
10967 && !intel_syntax)
10968 return (const reg_entry *) NULL;
10969
10970 return r;
10971 }
10972
10973 /* REG_STRING starts *before* REGISTER_PREFIX. */
10974
10975 static const reg_entry *
10976 parse_register (char *reg_string, char **end_op)
10977 {
10978 const reg_entry *r;
10979
10980 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
10981 r = parse_real_register (reg_string, end_op);
10982 else
10983 r = NULL;
10984 if (!r)
10985 {
10986 char *save = input_line_pointer;
10987 char c;
10988 symbolS *symbolP;
10989
10990 input_line_pointer = reg_string;
10991 c = get_symbol_name (&reg_string);
10992 symbolP = symbol_find (reg_string);
10993 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
10994 {
10995 const expressionS *e = symbol_get_value_expression (symbolP);
10996
10997 know (e->X_op == O_register);
10998 know (e->X_add_number >= 0
10999 && (valueT) e->X_add_number < i386_regtab_size);
11000 r = i386_regtab + e->X_add_number;
11001 if ((r->reg_flags & RegVRex))
11002 i.vec_encoding = vex_encoding_evex;
11003 *end_op = input_line_pointer;
11004 }
11005 *input_line_pointer = c;
11006 input_line_pointer = save;
11007 }
11008 return r;
11009 }
11010
11011 int
11012 i386_parse_name (char *name, expressionS *e, char *nextcharP)
11013 {
11014 const reg_entry *r;
11015 char *end = input_line_pointer;
11016
11017 *end = *nextcharP;
11018 r = parse_register (name, &input_line_pointer);
11019 if (r && end <= input_line_pointer)
11020 {
11021 *nextcharP = *input_line_pointer;
11022 *input_line_pointer = 0;
11023 e->X_op = O_register;
11024 e->X_add_number = r - i386_regtab;
11025 return 1;
11026 }
11027 input_line_pointer = end;
11028 *end = 0;
11029 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
11030 }
11031
11032 void
11033 md_operand (expressionS *e)
11034 {
11035 char *end;
11036 const reg_entry *r;
11037
11038 switch (*input_line_pointer)
11039 {
11040 case REGISTER_PREFIX:
11041 r = parse_real_register (input_line_pointer, &end);
11042 if (r)
11043 {
11044 e->X_op = O_register;
11045 e->X_add_number = r - i386_regtab;
11046 input_line_pointer = end;
11047 }
11048 break;
11049
11050 case '[':
11051 gas_assert (intel_syntax);
11052 end = input_line_pointer++;
11053 expression (e);
11054 if (*input_line_pointer == ']')
11055 {
11056 ++input_line_pointer;
11057 e->X_op_symbol = make_expr_symbol (e);
11058 e->X_add_symbol = NULL;
11059 e->X_add_number = 0;
11060 e->X_op = O_index;
11061 }
11062 else
11063 {
11064 e->X_op = O_absent;
11065 input_line_pointer = end;
11066 }
11067 break;
11068 }
11069 }
11070
11071 \f
11072 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11073 const char *md_shortopts = "kVQ:sqnO::";
11074 #else
11075 const char *md_shortopts = "qnO::";
11076 #endif
11077
11078 #define OPTION_32 (OPTION_MD_BASE + 0)
11079 #define OPTION_64 (OPTION_MD_BASE + 1)
11080 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
11081 #define OPTION_MARCH (OPTION_MD_BASE + 3)
11082 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
11083 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
11084 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
11085 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
11086 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
11087 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
11088 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
11089 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
11090 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
11091 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
11092 #define OPTION_X32 (OPTION_MD_BASE + 14)
11093 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
11094 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
11095 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
11096 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
11097 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
11098 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
11099 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
11100 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
11101 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
11102 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
11103 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
11104 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
11105
11106 struct option md_longopts[] =
11107 {
11108 {"32", no_argument, NULL, OPTION_32},
11109 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11110 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11111 {"64", no_argument, NULL, OPTION_64},
11112 #endif
11113 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11114 {"x32", no_argument, NULL, OPTION_X32},
11115 {"mshared", no_argument, NULL, OPTION_MSHARED},
11116 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
11117 #endif
11118 {"divide", no_argument, NULL, OPTION_DIVIDE},
11119 {"march", required_argument, NULL, OPTION_MARCH},
11120 {"mtune", required_argument, NULL, OPTION_MTUNE},
11121 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
11122 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
11123 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
11124 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
11125 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
11126 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
11127 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
11128 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
11129 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
11130 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
11131 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
11132 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
11133 # if defined (TE_PE) || defined (TE_PEP)
11134 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
11135 #endif
11136 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
11137 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
11138 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
11139 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
11140 {"mamd64", no_argument, NULL, OPTION_MAMD64},
11141 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
11142 {NULL, no_argument, NULL, 0}
11143 };
11144 size_t md_longopts_size = sizeof (md_longopts);
11145
11146 int
11147 md_parse_option (int c, const char *arg)
11148 {
11149 unsigned int j;
11150 char *arch, *next, *saved;
11151
11152 switch (c)
11153 {
11154 case 'n':
11155 optimize_align_code = 0;
11156 break;
11157
11158 case 'q':
11159 quiet_warnings = 1;
11160 break;
11161
11162 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11163 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
11164 should be emitted or not. FIXME: Not implemented. */
11165 case 'Q':
11166 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
11167 return 0;
11168 break;
11169
11170 /* -V: SVR4 argument to print version ID. */
11171 case 'V':
11172 print_version_id ();
11173 break;
11174
11175 /* -k: Ignore for FreeBSD compatibility. */
11176 case 'k':
11177 break;
11178
11179 case 's':
11180 /* -s: On i386 Solaris, this tells the native assembler to use
11181 .stab instead of .stab.excl. We always use .stab anyhow. */
11182 break;
11183
11184 case OPTION_MSHARED:
11185 shared = 1;
11186 break;
11187
11188 case OPTION_X86_USED_NOTE:
11189 if (strcasecmp (arg, "yes") == 0)
11190 x86_used_note = 1;
11191 else if (strcasecmp (arg, "no") == 0)
11192 x86_used_note = 0;
11193 else
11194 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
11195 break;
11196
11197
11198 #endif
11199 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11200 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11201 case OPTION_64:
11202 {
11203 const char **list, **l;
11204
11205 list = bfd_target_list ();
11206 for (l = list; *l != NULL; l++)
11207 if (CONST_STRNEQ (*l, "elf64-x86-64")
11208 || strcmp (*l, "coff-x86-64") == 0
11209 || strcmp (*l, "pe-x86-64") == 0
11210 || strcmp (*l, "pei-x86-64") == 0
11211 || strcmp (*l, "mach-o-x86-64") == 0)
11212 {
11213 default_arch = "x86_64";
11214 break;
11215 }
11216 if (*l == NULL)
11217 as_fatal (_("no compiled in support for x86_64"));
11218 free (list);
11219 }
11220 break;
11221 #endif
11222
11223 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11224 case OPTION_X32:
11225 if (IS_ELF)
11226 {
11227 const char **list, **l;
11228
11229 list = bfd_target_list ();
11230 for (l = list; *l != NULL; l++)
11231 if (CONST_STRNEQ (*l, "elf32-x86-64"))
11232 {
11233 default_arch = "x86_64:32";
11234 break;
11235 }
11236 if (*l == NULL)
11237 as_fatal (_("no compiled in support for 32bit x86_64"));
11238 free (list);
11239 }
11240 else
11241 as_fatal (_("32bit x86_64 is only supported for ELF"));
11242 break;
11243 #endif
11244
11245 case OPTION_32:
11246 default_arch = "i386";
11247 break;
11248
11249 case OPTION_DIVIDE:
11250 #ifdef SVR4_COMMENT_CHARS
11251 {
11252 char *n, *t;
11253 const char *s;
11254
11255 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
11256 t = n;
11257 for (s = i386_comment_chars; *s != '\0'; s++)
11258 if (*s != '/')
11259 *t++ = *s;
11260 *t = '\0';
11261 i386_comment_chars = n;
11262 }
11263 #endif
11264 break;
11265
11266 case OPTION_MARCH:
11267 saved = xstrdup (arg);
11268 arch = saved;
11269 /* Allow -march=+nosse. */
11270 if (*arch == '+')
11271 arch++;
11272 do
11273 {
11274 if (*arch == '.')
11275 as_fatal (_("invalid -march= option: `%s'"), arg);
11276 next = strchr (arch, '+');
11277 if (next)
11278 *next++ = '\0';
11279 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11280 {
11281 if (strcmp (arch, cpu_arch [j].name) == 0)
11282 {
11283 /* Processor. */
11284 if (! cpu_arch[j].flags.bitfield.cpui386)
11285 continue;
11286
11287 cpu_arch_name = cpu_arch[j].name;
11288 cpu_sub_arch_name = NULL;
11289 cpu_arch_flags = cpu_arch[j].flags;
11290 cpu_arch_isa = cpu_arch[j].type;
11291 cpu_arch_isa_flags = cpu_arch[j].flags;
11292 if (!cpu_arch_tune_set)
11293 {
11294 cpu_arch_tune = cpu_arch_isa;
11295 cpu_arch_tune_flags = cpu_arch_isa_flags;
11296 }
11297 break;
11298 }
11299 else if (*cpu_arch [j].name == '.'
11300 && strcmp (arch, cpu_arch [j].name + 1) == 0)
11301 {
11302 /* ISA extension. */
11303 i386_cpu_flags flags;
11304
11305 flags = cpu_flags_or (cpu_arch_flags,
11306 cpu_arch[j].flags);
11307
11308 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
11309 {
11310 if (cpu_sub_arch_name)
11311 {
11312 char *name = cpu_sub_arch_name;
11313 cpu_sub_arch_name = concat (name,
11314 cpu_arch[j].name,
11315 (const char *) NULL);
11316 free (name);
11317 }
11318 else
11319 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
11320 cpu_arch_flags = flags;
11321 cpu_arch_isa_flags = flags;
11322 }
11323 else
11324 cpu_arch_isa_flags
11325 = cpu_flags_or (cpu_arch_isa_flags,
11326 cpu_arch[j].flags);
11327 break;
11328 }
11329 }
11330
11331 if (j >= ARRAY_SIZE (cpu_arch))
11332 {
11333 /* Disable an ISA extension. */
11334 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11335 if (strcmp (arch, cpu_noarch [j].name) == 0)
11336 {
11337 i386_cpu_flags flags;
11338
11339 flags = cpu_flags_and_not (cpu_arch_flags,
11340 cpu_noarch[j].flags);
11341 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
11342 {
11343 if (cpu_sub_arch_name)
11344 {
11345 char *name = cpu_sub_arch_name;
11346 cpu_sub_arch_name = concat (arch,
11347 (const char *) NULL);
11348 free (name);
11349 }
11350 else
11351 cpu_sub_arch_name = xstrdup (arch);
11352 cpu_arch_flags = flags;
11353 cpu_arch_isa_flags = flags;
11354 }
11355 break;
11356 }
11357
11358 if (j >= ARRAY_SIZE (cpu_noarch))
11359 j = ARRAY_SIZE (cpu_arch);
11360 }
11361
11362 if (j >= ARRAY_SIZE (cpu_arch))
11363 as_fatal (_("invalid -march= option: `%s'"), arg);
11364
11365 arch = next;
11366 }
11367 while (next != NULL);
11368 free (saved);
11369 break;
11370
11371 case OPTION_MTUNE:
11372 if (*arg == '.')
11373 as_fatal (_("invalid -mtune= option: `%s'"), arg);
11374 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11375 {
11376 if (strcmp (arg, cpu_arch [j].name) == 0)
11377 {
11378 cpu_arch_tune_set = 1;
11379 cpu_arch_tune = cpu_arch [j].type;
11380 cpu_arch_tune_flags = cpu_arch[j].flags;
11381 break;
11382 }
11383 }
11384 if (j >= ARRAY_SIZE (cpu_arch))
11385 as_fatal (_("invalid -mtune= option: `%s'"), arg);
11386 break;
11387
11388 case OPTION_MMNEMONIC:
11389 if (strcasecmp (arg, "att") == 0)
11390 intel_mnemonic = 0;
11391 else if (strcasecmp (arg, "intel") == 0)
11392 intel_mnemonic = 1;
11393 else
11394 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
11395 break;
11396
11397 case OPTION_MSYNTAX:
11398 if (strcasecmp (arg, "att") == 0)
11399 intel_syntax = 0;
11400 else if (strcasecmp (arg, "intel") == 0)
11401 intel_syntax = 1;
11402 else
11403 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
11404 break;
11405
11406 case OPTION_MINDEX_REG:
11407 allow_index_reg = 1;
11408 break;
11409
11410 case OPTION_MNAKED_REG:
11411 allow_naked_reg = 1;
11412 break;
11413
11414 case OPTION_MSSE2AVX:
11415 sse2avx = 1;
11416 break;
11417
11418 case OPTION_MSSE_CHECK:
11419 if (strcasecmp (arg, "error") == 0)
11420 sse_check = check_error;
11421 else if (strcasecmp (arg, "warning") == 0)
11422 sse_check = check_warning;
11423 else if (strcasecmp (arg, "none") == 0)
11424 sse_check = check_none;
11425 else
11426 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
11427 break;
11428
11429 case OPTION_MOPERAND_CHECK:
11430 if (strcasecmp (arg, "error") == 0)
11431 operand_check = check_error;
11432 else if (strcasecmp (arg, "warning") == 0)
11433 operand_check = check_warning;
11434 else if (strcasecmp (arg, "none") == 0)
11435 operand_check = check_none;
11436 else
11437 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
11438 break;
11439
11440 case OPTION_MAVXSCALAR:
11441 if (strcasecmp (arg, "128") == 0)
11442 avxscalar = vex128;
11443 else if (strcasecmp (arg, "256") == 0)
11444 avxscalar = vex256;
11445 else
11446 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
11447 break;
11448
11449 case OPTION_MVEXWIG:
11450 if (strcmp (arg, "0") == 0)
11451 vexwig = vexw0;
11452 else if (strcmp (arg, "1") == 0)
11453 vexwig = vexw1;
11454 else
11455 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
11456 break;
11457
11458 case OPTION_MADD_BND_PREFIX:
11459 add_bnd_prefix = 1;
11460 break;
11461
11462 case OPTION_MEVEXLIG:
11463 if (strcmp (arg, "128") == 0)
11464 evexlig = evexl128;
11465 else if (strcmp (arg, "256") == 0)
11466 evexlig = evexl256;
11467 else if (strcmp (arg, "512") == 0)
11468 evexlig = evexl512;
11469 else
11470 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
11471 break;
11472
11473 case OPTION_MEVEXRCIG:
11474 if (strcmp (arg, "rne") == 0)
11475 evexrcig = rne;
11476 else if (strcmp (arg, "rd") == 0)
11477 evexrcig = rd;
11478 else if (strcmp (arg, "ru") == 0)
11479 evexrcig = ru;
11480 else if (strcmp (arg, "rz") == 0)
11481 evexrcig = rz;
11482 else
11483 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
11484 break;
11485
11486 case OPTION_MEVEXWIG:
11487 if (strcmp (arg, "0") == 0)
11488 evexwig = evexw0;
11489 else if (strcmp (arg, "1") == 0)
11490 evexwig = evexw1;
11491 else
11492 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
11493 break;
11494
11495 # if defined (TE_PE) || defined (TE_PEP)
11496 case OPTION_MBIG_OBJ:
11497 use_big_obj = 1;
11498 break;
11499 #endif
11500
11501 case OPTION_MOMIT_LOCK_PREFIX:
11502 if (strcasecmp (arg, "yes") == 0)
11503 omit_lock_prefix = 1;
11504 else if (strcasecmp (arg, "no") == 0)
11505 omit_lock_prefix = 0;
11506 else
11507 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
11508 break;
11509
11510 case OPTION_MFENCE_AS_LOCK_ADD:
11511 if (strcasecmp (arg, "yes") == 0)
11512 avoid_fence = 1;
11513 else if (strcasecmp (arg, "no") == 0)
11514 avoid_fence = 0;
11515 else
11516 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
11517 break;
11518
11519 case OPTION_MRELAX_RELOCATIONS:
11520 if (strcasecmp (arg, "yes") == 0)
11521 generate_relax_relocations = 1;
11522 else if (strcasecmp (arg, "no") == 0)
11523 generate_relax_relocations = 0;
11524 else
11525 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
11526 break;
11527
11528 case OPTION_MAMD64:
11529 intel64 = 0;
11530 break;
11531
11532 case OPTION_MINTEL64:
11533 intel64 = 1;
11534 break;
11535
11536 case 'O':
11537 if (arg == NULL)
11538 {
11539 optimize = 1;
11540 /* Turn off -Os. */
11541 optimize_for_space = 0;
11542 }
11543 else if (*arg == 's')
11544 {
11545 optimize_for_space = 1;
11546 /* Turn on all encoding optimizations. */
11547 optimize = INT_MAX;
11548 }
11549 else
11550 {
11551 optimize = atoi (arg);
11552 /* Turn off -Os. */
11553 optimize_for_space = 0;
11554 }
11555 break;
11556
11557 default:
11558 return 0;
11559 }
11560 return 1;
11561 }
11562
11563 #define MESSAGE_TEMPLATE \
11564 " "
11565
11566 static char *
11567 output_message (FILE *stream, char *p, char *message, char *start,
11568 int *left_p, const char *name, int len)
11569 {
11570 int size = sizeof (MESSAGE_TEMPLATE);
11571 int left = *left_p;
11572
11573 /* Reserve 2 spaces for ", " or ",\0" */
11574 left -= len + 2;
11575
11576 /* Check if there is any room. */
11577 if (left >= 0)
11578 {
11579 if (p != start)
11580 {
11581 *p++ = ',';
11582 *p++ = ' ';
11583 }
11584 p = mempcpy (p, name, len);
11585 }
11586 else
11587 {
11588 /* Output the current message now and start a new one. */
11589 *p++ = ',';
11590 *p = '\0';
11591 fprintf (stream, "%s\n", message);
11592 p = start;
11593 left = size - (start - message) - len - 2;
11594
11595 gas_assert (left >= 0);
11596
11597 p = mempcpy (p, name, len);
11598 }
11599
11600 *left_p = left;
11601 return p;
11602 }
11603
11604 static void
11605 show_arch (FILE *stream, int ext, int check)
11606 {
11607 static char message[] = MESSAGE_TEMPLATE;
11608 char *start = message + 27;
11609 char *p;
11610 int size = sizeof (MESSAGE_TEMPLATE);
11611 int left;
11612 const char *name;
11613 int len;
11614 unsigned int j;
11615
11616 p = start;
11617 left = size - (start - message);
11618 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11619 {
11620 /* Should it be skipped? */
11621 if (cpu_arch [j].skip)
11622 continue;
11623
11624 name = cpu_arch [j].name;
11625 len = cpu_arch [j].len;
11626 if (*name == '.')
11627 {
11628 /* It is an extension. Skip if we aren't asked to show it. */
11629 if (ext)
11630 {
11631 name++;
11632 len--;
11633 }
11634 else
11635 continue;
11636 }
11637 else if (ext)
11638 {
11639 /* It is an processor. Skip if we show only extension. */
11640 continue;
11641 }
11642 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
11643 {
11644 /* It is an impossible processor - skip. */
11645 continue;
11646 }
11647
11648 p = output_message (stream, p, message, start, &left, name, len);
11649 }
11650
11651 /* Display disabled extensions. */
11652 if (ext)
11653 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11654 {
11655 name = cpu_noarch [j].name;
11656 len = cpu_noarch [j].len;
11657 p = output_message (stream, p, message, start, &left, name,
11658 len);
11659 }
11660
11661 *p = '\0';
11662 fprintf (stream, "%s\n", message);
11663 }
11664
11665 void
11666 md_show_usage (FILE *stream)
11667 {
11668 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11669 fprintf (stream, _("\
11670 -Qy, -Qn ignored\n\
11671 -V print assembler version number\n\
11672 -k ignored\n"));
11673 #endif
11674 fprintf (stream, _("\
11675 -n Do not optimize code alignment\n\
11676 -q quieten some warnings\n"));
11677 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11678 fprintf (stream, _("\
11679 -s ignored\n"));
11680 #endif
11681 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11682 || defined (TE_PE) || defined (TE_PEP))
11683 fprintf (stream, _("\
11684 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
11685 #endif
11686 #ifdef SVR4_COMMENT_CHARS
11687 fprintf (stream, _("\
11688 --divide do not treat `/' as a comment character\n"));
11689 #else
11690 fprintf (stream, _("\
11691 --divide ignored\n"));
11692 #endif
11693 fprintf (stream, _("\
11694 -march=CPU[,+EXTENSION...]\n\
11695 generate code for CPU and EXTENSION, CPU is one of:\n"));
11696 show_arch (stream, 0, 1);
11697 fprintf (stream, _("\
11698 EXTENSION is combination of:\n"));
11699 show_arch (stream, 1, 0);
11700 fprintf (stream, _("\
11701 -mtune=CPU optimize for CPU, CPU is one of:\n"));
11702 show_arch (stream, 0, 0);
11703 fprintf (stream, _("\
11704 -msse2avx encode SSE instructions with VEX prefix\n"));
11705 fprintf (stream, _("\
11706 -msse-check=[none|error|warning] (default: warning)\n\
11707 check SSE instructions\n"));
11708 fprintf (stream, _("\
11709 -moperand-check=[none|error|warning] (default: warning)\n\
11710 check operand combinations for validity\n"));
11711 fprintf (stream, _("\
11712 -mavxscalar=[128|256] (default: 128)\n\
11713 encode scalar AVX instructions with specific vector\n\
11714 length\n"));
11715 fprintf (stream, _("\
11716 -mvexwig=[0|1] (default: 0)\n\
11717 encode VEX instructions with specific VEX.W value\n\
11718 for VEX.W bit ignored instructions\n"));
11719 fprintf (stream, _("\
11720 -mevexlig=[128|256|512] (default: 128)\n\
11721 encode scalar EVEX instructions with specific vector\n\
11722 length\n"));
11723 fprintf (stream, _("\
11724 -mevexwig=[0|1] (default: 0)\n\
11725 encode EVEX instructions with specific EVEX.W value\n\
11726 for EVEX.W bit ignored instructions\n"));
11727 fprintf (stream, _("\
11728 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
11729 encode EVEX instructions with specific EVEX.RC value\n\
11730 for SAE-only ignored instructions\n"));
11731 fprintf (stream, _("\
11732 -mmnemonic=[att|intel] "));
11733 if (SYSV386_COMPAT)
11734 fprintf (stream, _("(default: att)\n"));
11735 else
11736 fprintf (stream, _("(default: intel)\n"));
11737 fprintf (stream, _("\
11738 use AT&T/Intel mnemonic\n"));
11739 fprintf (stream, _("\
11740 -msyntax=[att|intel] (default: att)\n\
11741 use AT&T/Intel syntax\n"));
11742 fprintf (stream, _("\
11743 -mindex-reg support pseudo index registers\n"));
11744 fprintf (stream, _("\
11745 -mnaked-reg don't require `%%' prefix for registers\n"));
11746 fprintf (stream, _("\
11747 -madd-bnd-prefix add BND prefix for all valid branches\n"));
11748 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11749 fprintf (stream, _("\
11750 -mshared disable branch optimization for shared code\n"));
11751 fprintf (stream, _("\
11752 -mx86-used-note=[no|yes] "));
11753 if (DEFAULT_X86_USED_NOTE)
11754 fprintf (stream, _("(default: yes)\n"));
11755 else
11756 fprintf (stream, _("(default: no)\n"));
11757 fprintf (stream, _("\
11758 generate x86 used ISA and feature properties\n"));
11759 #endif
11760 #if defined (TE_PE) || defined (TE_PEP)
11761 fprintf (stream, _("\
11762 -mbig-obj generate big object files\n"));
11763 #endif
11764 fprintf (stream, _("\
11765 -momit-lock-prefix=[no|yes] (default: no)\n\
11766 strip all lock prefixes\n"));
11767 fprintf (stream, _("\
11768 -mfence-as-lock-add=[no|yes] (default: no)\n\
11769 encode lfence, mfence and sfence as\n\
11770 lock addl $0x0, (%%{re}sp)\n"));
11771 fprintf (stream, _("\
11772 -mrelax-relocations=[no|yes] "));
11773 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
11774 fprintf (stream, _("(default: yes)\n"));
11775 else
11776 fprintf (stream, _("(default: no)\n"));
11777 fprintf (stream, _("\
11778 generate relax relocations\n"));
11779 fprintf (stream, _("\
11780 -mamd64 accept only AMD64 ISA [default]\n"));
11781 fprintf (stream, _("\
11782 -mintel64 accept only Intel64 ISA\n"));
11783 }
11784
11785 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
11786 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11787 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11788
11789 /* Pick the target format to use. */
11790
11791 const char *
11792 i386_target_format (void)
11793 {
11794 if (!strncmp (default_arch, "x86_64", 6))
11795 {
11796 update_code_flag (CODE_64BIT, 1);
11797 if (default_arch[6] == '\0')
11798 x86_elf_abi = X86_64_ABI;
11799 else
11800 x86_elf_abi = X86_64_X32_ABI;
11801 }
11802 else if (!strcmp (default_arch, "i386"))
11803 update_code_flag (CODE_32BIT, 1);
11804 else if (!strcmp (default_arch, "iamcu"))
11805 {
11806 update_code_flag (CODE_32BIT, 1);
11807 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
11808 {
11809 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
11810 cpu_arch_name = "iamcu";
11811 cpu_sub_arch_name = NULL;
11812 cpu_arch_flags = iamcu_flags;
11813 cpu_arch_isa = PROCESSOR_IAMCU;
11814 cpu_arch_isa_flags = iamcu_flags;
11815 if (!cpu_arch_tune_set)
11816 {
11817 cpu_arch_tune = cpu_arch_isa;
11818 cpu_arch_tune_flags = cpu_arch_isa_flags;
11819 }
11820 }
11821 else if (cpu_arch_isa != PROCESSOR_IAMCU)
11822 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
11823 cpu_arch_name);
11824 }
11825 else
11826 as_fatal (_("unknown architecture"));
11827
11828 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
11829 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11830 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
11831 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11832
11833 switch (OUTPUT_FLAVOR)
11834 {
11835 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
11836 case bfd_target_aout_flavour:
11837 return AOUT_TARGET_FORMAT;
11838 #endif
11839 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
11840 # if defined (TE_PE) || defined (TE_PEP)
11841 case bfd_target_coff_flavour:
11842 if (flag_code == CODE_64BIT)
11843 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
11844 else
11845 return "pe-i386";
11846 # elif defined (TE_GO32)
11847 case bfd_target_coff_flavour:
11848 return "coff-go32";
11849 # else
11850 case bfd_target_coff_flavour:
11851 return "coff-i386";
11852 # endif
11853 #endif
11854 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
11855 case bfd_target_elf_flavour:
11856 {
11857 const char *format;
11858
11859 switch (x86_elf_abi)
11860 {
11861 default:
11862 format = ELF_TARGET_FORMAT;
11863 break;
11864 case X86_64_ABI:
11865 use_rela_relocations = 1;
11866 object_64bit = 1;
11867 format = ELF_TARGET_FORMAT64;
11868 break;
11869 case X86_64_X32_ABI:
11870 use_rela_relocations = 1;
11871 object_64bit = 1;
11872 disallow_64bit_reloc = 1;
11873 format = ELF_TARGET_FORMAT32;
11874 break;
11875 }
11876 if (cpu_arch_isa == PROCESSOR_L1OM)
11877 {
11878 if (x86_elf_abi != X86_64_ABI)
11879 as_fatal (_("Intel L1OM is 64bit only"));
11880 return ELF_TARGET_L1OM_FORMAT;
11881 }
11882 else if (cpu_arch_isa == PROCESSOR_K1OM)
11883 {
11884 if (x86_elf_abi != X86_64_ABI)
11885 as_fatal (_("Intel K1OM is 64bit only"));
11886 return ELF_TARGET_K1OM_FORMAT;
11887 }
11888 else if (cpu_arch_isa == PROCESSOR_IAMCU)
11889 {
11890 if (x86_elf_abi != I386_ABI)
11891 as_fatal (_("Intel MCU is 32bit only"));
11892 return ELF_TARGET_IAMCU_FORMAT;
11893 }
11894 else
11895 return format;
11896 }
11897 #endif
11898 #if defined (OBJ_MACH_O)
11899 case bfd_target_mach_o_flavour:
11900 if (flag_code == CODE_64BIT)
11901 {
11902 use_rela_relocations = 1;
11903 object_64bit = 1;
11904 return "mach-o-x86-64";
11905 }
11906 else
11907 return "mach-o-i386";
11908 #endif
11909 default:
11910 abort ();
11911 return NULL;
11912 }
11913 }
11914
11915 #endif /* OBJ_MAYBE_ more than one */
11916 \f
11917 symbolS *
11918 md_undefined_symbol (char *name)
11919 {
11920 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
11921 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
11922 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
11923 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
11924 {
11925 if (!GOT_symbol)
11926 {
11927 if (symbol_find (name))
11928 as_bad (_("GOT already in symbol table"));
11929 GOT_symbol = symbol_new (name, undefined_section,
11930 (valueT) 0, &zero_address_frag);
11931 };
11932 return GOT_symbol;
11933 }
11934 return 0;
11935 }
11936
11937 /* Round up a section size to the appropriate boundary. */
11938
11939 valueT
11940 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
11941 {
11942 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
11943 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
11944 {
11945 /* For a.out, force the section size to be aligned. If we don't do
11946 this, BFD will align it for us, but it will not write out the
11947 final bytes of the section. This may be a bug in BFD, but it is
11948 easier to fix it here since that is how the other a.out targets
11949 work. */
11950 int align;
11951
11952 align = bfd_section_alignment (segment);
11953 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
11954 }
11955 #endif
11956
11957 return size;
11958 }
11959
11960 /* On the i386, PC-relative offsets are relative to the start of the
11961 next instruction. That is, the address of the offset, plus its
11962 size, since the offset is always the last part of the insn. */
11963
11964 long
11965 md_pcrel_from (fixS *fixP)
11966 {
11967 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
11968 }
11969
11970 #ifndef I386COFF
11971
11972 static void
11973 s_bss (int ignore ATTRIBUTE_UNUSED)
11974 {
11975 int temp;
11976
11977 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11978 if (IS_ELF)
11979 obj_elf_section_change_hook ();
11980 #endif
11981 temp = get_absolute_expression ();
11982 subseg_set (bss_section, (subsegT) temp);
11983 demand_empty_rest_of_line ();
11984 }
11985
11986 #endif
11987
11988 void
11989 i386_validate_fix (fixS *fixp)
11990 {
11991 if (fixp->fx_subsy)
11992 {
11993 if (fixp->fx_subsy == GOT_symbol)
11994 {
11995 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
11996 {
11997 if (!object_64bit)
11998 abort ();
11999 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12000 if (fixp->fx_tcbit2)
12001 fixp->fx_r_type = (fixp->fx_tcbit
12002 ? BFD_RELOC_X86_64_REX_GOTPCRELX
12003 : BFD_RELOC_X86_64_GOTPCRELX);
12004 else
12005 #endif
12006 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
12007 }
12008 else
12009 {
12010 if (!object_64bit)
12011 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
12012 else
12013 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
12014 }
12015 fixp->fx_subsy = 0;
12016 }
12017 }
12018 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12019 else if (!object_64bit)
12020 {
12021 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
12022 && fixp->fx_tcbit2)
12023 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
12024 }
12025 #endif
12026 }
12027
12028 arelent *
12029 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
12030 {
12031 arelent *rel;
12032 bfd_reloc_code_real_type code;
12033
12034 switch (fixp->fx_r_type)
12035 {
12036 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12037 case BFD_RELOC_SIZE32:
12038 case BFD_RELOC_SIZE64:
12039 if (S_IS_DEFINED (fixp->fx_addsy)
12040 && !S_IS_EXTERNAL (fixp->fx_addsy))
12041 {
12042 /* Resolve size relocation against local symbol to size of
12043 the symbol plus addend. */
12044 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
12045 if (fixp->fx_r_type == BFD_RELOC_SIZE32
12046 && !fits_in_unsigned_long (value))
12047 as_bad_where (fixp->fx_file, fixp->fx_line,
12048 _("symbol size computation overflow"));
12049 fixp->fx_addsy = NULL;
12050 fixp->fx_subsy = NULL;
12051 md_apply_fix (fixp, (valueT *) &value, NULL);
12052 return NULL;
12053 }
12054 #endif
12055 /* Fall through. */
12056
12057 case BFD_RELOC_X86_64_PLT32:
12058 case BFD_RELOC_X86_64_GOT32:
12059 case BFD_RELOC_X86_64_GOTPCREL:
12060 case BFD_RELOC_X86_64_GOTPCRELX:
12061 case BFD_RELOC_X86_64_REX_GOTPCRELX:
12062 case BFD_RELOC_386_PLT32:
12063 case BFD_RELOC_386_GOT32:
12064 case BFD_RELOC_386_GOT32X:
12065 case BFD_RELOC_386_GOTOFF:
12066 case BFD_RELOC_386_GOTPC:
12067 case BFD_RELOC_386_TLS_GD:
12068 case BFD_RELOC_386_TLS_LDM:
12069 case BFD_RELOC_386_TLS_LDO_32:
12070 case BFD_RELOC_386_TLS_IE_32:
12071 case BFD_RELOC_386_TLS_IE:
12072 case BFD_RELOC_386_TLS_GOTIE:
12073 case BFD_RELOC_386_TLS_LE_32:
12074 case BFD_RELOC_386_TLS_LE:
12075 case BFD_RELOC_386_TLS_GOTDESC:
12076 case BFD_RELOC_386_TLS_DESC_CALL:
12077 case BFD_RELOC_X86_64_TLSGD:
12078 case BFD_RELOC_X86_64_TLSLD:
12079 case BFD_RELOC_X86_64_DTPOFF32:
12080 case BFD_RELOC_X86_64_DTPOFF64:
12081 case BFD_RELOC_X86_64_GOTTPOFF:
12082 case BFD_RELOC_X86_64_TPOFF32:
12083 case BFD_RELOC_X86_64_TPOFF64:
12084 case BFD_RELOC_X86_64_GOTOFF64:
12085 case BFD_RELOC_X86_64_GOTPC32:
12086 case BFD_RELOC_X86_64_GOT64:
12087 case BFD_RELOC_X86_64_GOTPCREL64:
12088 case BFD_RELOC_X86_64_GOTPC64:
12089 case BFD_RELOC_X86_64_GOTPLT64:
12090 case BFD_RELOC_X86_64_PLTOFF64:
12091 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12092 case BFD_RELOC_X86_64_TLSDESC_CALL:
12093 case BFD_RELOC_RVA:
12094 case BFD_RELOC_VTABLE_ENTRY:
12095 case BFD_RELOC_VTABLE_INHERIT:
12096 #ifdef TE_PE
12097 case BFD_RELOC_32_SECREL:
12098 #endif
12099 code = fixp->fx_r_type;
12100 break;
12101 case BFD_RELOC_X86_64_32S:
12102 if (!fixp->fx_pcrel)
12103 {
12104 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
12105 code = fixp->fx_r_type;
12106 break;
12107 }
12108 /* Fall through. */
12109 default:
12110 if (fixp->fx_pcrel)
12111 {
12112 switch (fixp->fx_size)
12113 {
12114 default:
12115 as_bad_where (fixp->fx_file, fixp->fx_line,
12116 _("can not do %d byte pc-relative relocation"),
12117 fixp->fx_size);
12118 code = BFD_RELOC_32_PCREL;
12119 break;
12120 case 1: code = BFD_RELOC_8_PCREL; break;
12121 case 2: code = BFD_RELOC_16_PCREL; break;
12122 case 4: code = BFD_RELOC_32_PCREL; break;
12123 #ifdef BFD64
12124 case 8: code = BFD_RELOC_64_PCREL; break;
12125 #endif
12126 }
12127 }
12128 else
12129 {
12130 switch (fixp->fx_size)
12131 {
12132 default:
12133 as_bad_where (fixp->fx_file, fixp->fx_line,
12134 _("can not do %d byte relocation"),
12135 fixp->fx_size);
12136 code = BFD_RELOC_32;
12137 break;
12138 case 1: code = BFD_RELOC_8; break;
12139 case 2: code = BFD_RELOC_16; break;
12140 case 4: code = BFD_RELOC_32; break;
12141 #ifdef BFD64
12142 case 8: code = BFD_RELOC_64; break;
12143 #endif
12144 }
12145 }
12146 break;
12147 }
12148
12149 if ((code == BFD_RELOC_32
12150 || code == BFD_RELOC_32_PCREL
12151 || code == BFD_RELOC_X86_64_32S)
12152 && GOT_symbol
12153 && fixp->fx_addsy == GOT_symbol)
12154 {
12155 if (!object_64bit)
12156 code = BFD_RELOC_386_GOTPC;
12157 else
12158 code = BFD_RELOC_X86_64_GOTPC32;
12159 }
12160 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
12161 && GOT_symbol
12162 && fixp->fx_addsy == GOT_symbol)
12163 {
12164 code = BFD_RELOC_X86_64_GOTPC64;
12165 }
12166
12167 rel = XNEW (arelent);
12168 rel->sym_ptr_ptr = XNEW (asymbol *);
12169 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
12170
12171 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
12172
12173 if (!use_rela_relocations)
12174 {
12175 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
12176 vtable entry to be used in the relocation's section offset. */
12177 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
12178 rel->address = fixp->fx_offset;
12179 #if defined (OBJ_COFF) && defined (TE_PE)
12180 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
12181 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
12182 else
12183 #endif
12184 rel->addend = 0;
12185 }
12186 /* Use the rela in 64bit mode. */
12187 else
12188 {
12189 if (disallow_64bit_reloc)
12190 switch (code)
12191 {
12192 case BFD_RELOC_X86_64_DTPOFF64:
12193 case BFD_RELOC_X86_64_TPOFF64:
12194 case BFD_RELOC_64_PCREL:
12195 case BFD_RELOC_X86_64_GOTOFF64:
12196 case BFD_RELOC_X86_64_GOT64:
12197 case BFD_RELOC_X86_64_GOTPCREL64:
12198 case BFD_RELOC_X86_64_GOTPC64:
12199 case BFD_RELOC_X86_64_GOTPLT64:
12200 case BFD_RELOC_X86_64_PLTOFF64:
12201 as_bad_where (fixp->fx_file, fixp->fx_line,
12202 _("cannot represent relocation type %s in x32 mode"),
12203 bfd_get_reloc_code_name (code));
12204 break;
12205 default:
12206 break;
12207 }
12208
12209 if (!fixp->fx_pcrel)
12210 rel->addend = fixp->fx_offset;
12211 else
12212 switch (code)
12213 {
12214 case BFD_RELOC_X86_64_PLT32:
12215 case BFD_RELOC_X86_64_GOT32:
12216 case BFD_RELOC_X86_64_GOTPCREL:
12217 case BFD_RELOC_X86_64_GOTPCRELX:
12218 case BFD_RELOC_X86_64_REX_GOTPCRELX:
12219 case BFD_RELOC_X86_64_TLSGD:
12220 case BFD_RELOC_X86_64_TLSLD:
12221 case BFD_RELOC_X86_64_GOTTPOFF:
12222 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12223 case BFD_RELOC_X86_64_TLSDESC_CALL:
12224 rel->addend = fixp->fx_offset - fixp->fx_size;
12225 break;
12226 default:
12227 rel->addend = (section->vma
12228 - fixp->fx_size
12229 + fixp->fx_addnumber
12230 + md_pcrel_from (fixp));
12231 break;
12232 }
12233 }
12234
12235 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
12236 if (rel->howto == NULL)
12237 {
12238 as_bad_where (fixp->fx_file, fixp->fx_line,
12239 _("cannot represent relocation type %s"),
12240 bfd_get_reloc_code_name (code));
12241 /* Set howto to a garbage value so that we can keep going. */
12242 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
12243 gas_assert (rel->howto != NULL);
12244 }
12245
12246 return rel;
12247 }
12248
12249 #include "tc-i386-intel.c"
12250
12251 void
12252 tc_x86_parse_to_dw2regnum (expressionS *exp)
12253 {
12254 int saved_naked_reg;
12255 char saved_register_dot;
12256
12257 saved_naked_reg = allow_naked_reg;
12258 allow_naked_reg = 1;
12259 saved_register_dot = register_chars['.'];
12260 register_chars['.'] = '.';
12261 allow_pseudo_reg = 1;
12262 expression_and_evaluate (exp);
12263 allow_pseudo_reg = 0;
12264 register_chars['.'] = saved_register_dot;
12265 allow_naked_reg = saved_naked_reg;
12266
12267 if (exp->X_op == O_register && exp->X_add_number >= 0)
12268 {
12269 if ((addressT) exp->X_add_number < i386_regtab_size)
12270 {
12271 exp->X_op = O_constant;
12272 exp->X_add_number = i386_regtab[exp->X_add_number]
12273 .dw2_regnum[flag_code >> 1];
12274 }
12275 else
12276 exp->X_op = O_illegal;
12277 }
12278 }
12279
12280 void
12281 tc_x86_frame_initial_instructions (void)
12282 {
12283 static unsigned int sp_regno[2];
12284
12285 if (!sp_regno[flag_code >> 1])
12286 {
12287 char *saved_input = input_line_pointer;
12288 char sp[][4] = {"esp", "rsp"};
12289 expressionS exp;
12290
12291 input_line_pointer = sp[flag_code >> 1];
12292 tc_x86_parse_to_dw2regnum (&exp);
12293 gas_assert (exp.X_op == O_constant);
12294 sp_regno[flag_code >> 1] = exp.X_add_number;
12295 input_line_pointer = saved_input;
12296 }
12297
12298 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
12299 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
12300 }
12301
12302 int
12303 x86_dwarf2_addr_size (void)
12304 {
12305 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
12306 if (x86_elf_abi == X86_64_X32_ABI)
12307 return 4;
12308 #endif
12309 return bfd_arch_bits_per_address (stdoutput) / 8;
12310 }
12311
12312 int
12313 i386_elf_section_type (const char *str, size_t len)
12314 {
12315 if (flag_code == CODE_64BIT
12316 && len == sizeof ("unwind") - 1
12317 && strncmp (str, "unwind", 6) == 0)
12318 return SHT_X86_64_UNWIND;
12319
12320 return -1;
12321 }
12322
12323 #ifdef TE_SOLARIS
12324 void
12325 i386_solaris_fix_up_eh_frame (segT sec)
12326 {
12327 if (flag_code == CODE_64BIT)
12328 elf_section_type (sec) = SHT_X86_64_UNWIND;
12329 }
12330 #endif
12331
12332 #ifdef TE_PE
12333 void
12334 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
12335 {
12336 expressionS exp;
12337
12338 exp.X_op = O_secrel;
12339 exp.X_add_symbol = symbol;
12340 exp.X_add_number = 0;
12341 emit_expr (&exp, size);
12342 }
12343 #endif
12344
12345 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12346 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
12347
12348 bfd_vma
12349 x86_64_section_letter (int letter, const char **ptr_msg)
12350 {
12351 if (flag_code == CODE_64BIT)
12352 {
12353 if (letter == 'l')
12354 return SHF_X86_64_LARGE;
12355
12356 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
12357 }
12358 else
12359 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
12360 return -1;
12361 }
12362
12363 bfd_vma
12364 x86_64_section_word (char *str, size_t len)
12365 {
12366 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
12367 return SHF_X86_64_LARGE;
12368
12369 return -1;
12370 }
12371
12372 static void
12373 handle_large_common (int small ATTRIBUTE_UNUSED)
12374 {
12375 if (flag_code != CODE_64BIT)
12376 {
12377 s_comm_internal (0, elf_common_parse);
12378 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
12379 }
12380 else
12381 {
12382 static segT lbss_section;
12383 asection *saved_com_section_ptr = elf_com_section_ptr;
12384 asection *saved_bss_section = bss_section;
12385
12386 if (lbss_section == NULL)
12387 {
12388 flagword applicable;
12389 segT seg = now_seg;
12390 subsegT subseg = now_subseg;
12391
12392 /* The .lbss section is for local .largecomm symbols. */
12393 lbss_section = subseg_new (".lbss", 0);
12394 applicable = bfd_applicable_section_flags (stdoutput);
12395 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
12396 seg_info (lbss_section)->bss = 1;
12397
12398 subseg_set (seg, subseg);
12399 }
12400
12401 elf_com_section_ptr = &_bfd_elf_large_com_section;
12402 bss_section = lbss_section;
12403
12404 s_comm_internal (0, elf_common_parse);
12405
12406 elf_com_section_ptr = saved_com_section_ptr;
12407 bss_section = saved_bss_section;
12408 }
12409 }
12410 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */