]> git.ipfire.org Git - thirdparty/binutils-gdb.git/blob - gas/config/tc-i386.c
x86: Add CpuCMOV and CpuFXSR
[thirdparty/binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2018 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifndef REGISTER_WARNINGS
37 #define REGISTER_WARNINGS 1
38 #endif
39
40 #ifndef INFER_ADDR_PREFIX
41 #define INFER_ADDR_PREFIX 1
42 #endif
43
44 #ifndef DEFAULT_ARCH
45 #define DEFAULT_ARCH "i386"
46 #endif
47
48 #ifndef INLINE
49 #if __GNUC__ >= 2
50 #define INLINE __inline__
51 #else
52 #define INLINE
53 #endif
54 #endif
55
56 /* Prefixes will be emitted in the order defined below.
57 WAIT_PREFIX must be the first prefix since FWAIT is really is an
58 instruction, and so must come before any prefixes.
59 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
60 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
61 #define WAIT_PREFIX 0
62 #define SEG_PREFIX 1
63 #define ADDR_PREFIX 2
64 #define DATA_PREFIX 3
65 #define REP_PREFIX 4
66 #define HLE_PREFIX REP_PREFIX
67 #define BND_PREFIX REP_PREFIX
68 #define LOCK_PREFIX 5
69 #define REX_PREFIX 6 /* must come last. */
70 #define MAX_PREFIXES 7 /* max prefixes per opcode */
71
72 /* we define the syntax here (modulo base,index,scale syntax) */
73 #define REGISTER_PREFIX '%'
74 #define IMMEDIATE_PREFIX '$'
75 #define ABSOLUTE_PREFIX '*'
76
77 /* these are the instruction mnemonic suffixes in AT&T syntax or
78 memory operand size in Intel syntax. */
79 #define WORD_MNEM_SUFFIX 'w'
80 #define BYTE_MNEM_SUFFIX 'b'
81 #define SHORT_MNEM_SUFFIX 's'
82 #define LONG_MNEM_SUFFIX 'l'
83 #define QWORD_MNEM_SUFFIX 'q'
84 /* Intel Syntax. Use a non-ascii letter since since it never appears
85 in instructions. */
86 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
87
88 #define END_OF_INSN '\0'
89
90 /*
91 'templates' is for grouping together 'template' structures for opcodes
92 of the same name. This is only used for storing the insns in the grand
93 ole hash table of insns.
94 The templates themselves start at START and range up to (but not including)
95 END.
96 */
97 typedef struct
98 {
99 const insn_template *start;
100 const insn_template *end;
101 }
102 templates;
103
104 /* 386 operand encoding bytes: see 386 book for details of this. */
105 typedef struct
106 {
107 unsigned int regmem; /* codes register or memory operand */
108 unsigned int reg; /* codes register operand (or extended opcode) */
109 unsigned int mode; /* how to interpret regmem & reg */
110 }
111 modrm_byte;
112
113 /* x86-64 extension prefix. */
114 typedef int rex_byte;
115
116 /* 386 opcode byte to code indirect addressing. */
117 typedef struct
118 {
119 unsigned base;
120 unsigned index;
121 unsigned scale;
122 }
123 sib_byte;
124
125 /* x86 arch names, types and features */
126 typedef struct
127 {
128 const char *name; /* arch name */
129 unsigned int len; /* arch string length */
130 enum processor_type type; /* arch type */
131 i386_cpu_flags flags; /* cpu feature flags */
132 unsigned int skip; /* show_arch should skip this. */
133 }
134 arch_entry;
135
136 /* Used to turn off indicated flags. */
137 typedef struct
138 {
139 const char *name; /* arch name */
140 unsigned int len; /* arch string length */
141 i386_cpu_flags flags; /* cpu feature flags */
142 }
143 noarch_entry;
144
145 static void update_code_flag (int, int);
146 static void set_code_flag (int);
147 static void set_16bit_gcc_code_flag (int);
148 static void set_intel_syntax (int);
149 static void set_intel_mnemonic (int);
150 static void set_allow_index_reg (int);
151 static void set_check (int);
152 static void set_cpu_arch (int);
153 #ifdef TE_PE
154 static void pe_directive_secrel (int);
155 #endif
156 static void signed_cons (int);
157 static char *output_invalid (int c);
158 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
159 const char *);
160 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
161 const char *);
162 static int i386_att_operand (char *);
163 static int i386_intel_operand (char *, int);
164 static int i386_intel_simplify (expressionS *);
165 static int i386_intel_parse_name (const char *, expressionS *);
166 static const reg_entry *parse_register (char *, char **);
167 static char *parse_insn (char *, char *);
168 static char *parse_operands (char *, const char *);
169 static void swap_operands (void);
170 static void swap_2_operands (int, int);
171 static void optimize_imm (void);
172 static void optimize_disp (void);
173 static const insn_template *match_template (char);
174 static int check_string (void);
175 static int process_suffix (void);
176 static int check_byte_reg (void);
177 static int check_long_reg (void);
178 static int check_qword_reg (void);
179 static int check_word_reg (void);
180 static int finalize_imm (void);
181 static int process_operands (void);
182 static const seg_entry *build_modrm_byte (void);
183 static void output_insn (void);
184 static void output_imm (fragS *, offsetT);
185 static void output_disp (fragS *, offsetT);
186 #ifndef I386COFF
187 static void s_bss (int);
188 #endif
189 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
190 static void handle_large_common (int small ATTRIBUTE_UNUSED);
191 #endif
192
193 static const char *default_arch = DEFAULT_ARCH;
194
195 /* This struct describes rounding control and SAE in the instruction. */
196 struct RC_Operation
197 {
198 enum rc_type
199 {
200 rne = 0,
201 rd,
202 ru,
203 rz,
204 saeonly
205 } type;
206 int operand;
207 };
208
209 static struct RC_Operation rc_op;
210
211 /* The struct describes masking, applied to OPERAND in the instruction.
212 MASK is a pointer to the corresponding mask register. ZEROING tells
213 whether merging or zeroing mask is used. */
214 struct Mask_Operation
215 {
216 const reg_entry *mask;
217 unsigned int zeroing;
218 /* The operand where this operation is associated. */
219 int operand;
220 };
221
222 static struct Mask_Operation mask_op;
223
224 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
225 broadcast factor. */
226 struct Broadcast_Operation
227 {
228 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
229 int type;
230
231 /* Index of broadcasted operand. */
232 int operand;
233
234 /* Number of bytes to broadcast. */
235 int bytes;
236 };
237
238 static struct Broadcast_Operation broadcast_op;
239
240 /* VEX prefix. */
241 typedef struct
242 {
243 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
244 unsigned char bytes[4];
245 unsigned int length;
246 /* Destination or source register specifier. */
247 const reg_entry *register_specifier;
248 } vex_prefix;
249
250 /* 'md_assemble ()' gathers together information and puts it into a
251 i386_insn. */
252
253 union i386_op
254 {
255 expressionS *disps;
256 expressionS *imms;
257 const reg_entry *regs;
258 };
259
260 enum i386_error
261 {
262 operand_size_mismatch,
263 operand_type_mismatch,
264 register_type_mismatch,
265 number_of_operands_mismatch,
266 invalid_instruction_suffix,
267 bad_imm4,
268 unsupported_with_intel_mnemonic,
269 unsupported_syntax,
270 unsupported,
271 invalid_vsib_address,
272 invalid_vector_register_set,
273 unsupported_vector_index_register,
274 unsupported_broadcast,
275 broadcast_needed,
276 unsupported_masking,
277 mask_not_on_destination,
278 no_default_mask,
279 unsupported_rc_sae,
280 rc_sae_operand_not_last_imm,
281 invalid_register_operand,
282 };
283
284 struct _i386_insn
285 {
286 /* TM holds the template for the insn were currently assembling. */
287 insn_template tm;
288
289 /* SUFFIX holds the instruction size suffix for byte, word, dword
290 or qword, if given. */
291 char suffix;
292
293 /* OPERANDS gives the number of given operands. */
294 unsigned int operands;
295
296 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
297 of given register, displacement, memory operands and immediate
298 operands. */
299 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
300
301 /* TYPES [i] is the type (see above #defines) which tells us how to
302 use OP[i] for the corresponding operand. */
303 i386_operand_type types[MAX_OPERANDS];
304
305 /* Displacement expression, immediate expression, or register for each
306 operand. */
307 union i386_op op[MAX_OPERANDS];
308
309 /* Flags for operands. */
310 unsigned int flags[MAX_OPERANDS];
311 #define Operand_PCrel 1
312 #define Operand_Mem 2
313
314 /* Relocation type for operand */
315 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
316
317 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
318 the base index byte below. */
319 const reg_entry *base_reg;
320 const reg_entry *index_reg;
321 unsigned int log2_scale_factor;
322
323 /* SEG gives the seg_entries of this insn. They are zero unless
324 explicit segment overrides are given. */
325 const seg_entry *seg[2];
326
327 /* Copied first memory operand string, for re-checking. */
328 char *memop1_string;
329
330 /* PREFIX holds all the given prefix opcodes (usually null).
331 PREFIXES is the number of prefix opcodes. */
332 unsigned int prefixes;
333 unsigned char prefix[MAX_PREFIXES];
334
335 /* RM and SIB are the modrm byte and the sib byte where the
336 addressing modes of this insn are encoded. */
337 modrm_byte rm;
338 rex_byte rex;
339 rex_byte vrex;
340 sib_byte sib;
341 vex_prefix vex;
342
343 /* Masking attributes. */
344 struct Mask_Operation *mask;
345
346 /* Rounding control and SAE attributes. */
347 struct RC_Operation *rounding;
348
349 /* Broadcasting attributes. */
350 struct Broadcast_Operation *broadcast;
351
352 /* Compressed disp8*N attribute. */
353 unsigned int memshift;
354
355 /* Prefer load or store in encoding. */
356 enum
357 {
358 dir_encoding_default = 0,
359 dir_encoding_load,
360 dir_encoding_store
361 } dir_encoding;
362
363 /* Prefer 8bit or 32bit displacement in encoding. */
364 enum
365 {
366 disp_encoding_default = 0,
367 disp_encoding_8bit,
368 disp_encoding_32bit
369 } disp_encoding;
370
371 /* Prefer the REX byte in encoding. */
372 bfd_boolean rex_encoding;
373
374 /* Disable instruction size optimization. */
375 bfd_boolean no_optimize;
376
377 /* How to encode vector instructions. */
378 enum
379 {
380 vex_encoding_default = 0,
381 vex_encoding_vex2,
382 vex_encoding_vex3,
383 vex_encoding_evex
384 } vec_encoding;
385
386 /* REP prefix. */
387 const char *rep_prefix;
388
389 /* HLE prefix. */
390 const char *hle_prefix;
391
392 /* Have BND prefix. */
393 const char *bnd_prefix;
394
395 /* Have NOTRACK prefix. */
396 const char *notrack_prefix;
397
398 /* Error message. */
399 enum i386_error error;
400 };
401
402 typedef struct _i386_insn i386_insn;
403
404 /* Link RC type with corresponding string, that'll be looked for in
405 asm. */
406 struct RC_name
407 {
408 enum rc_type type;
409 const char *name;
410 unsigned int len;
411 };
412
413 static const struct RC_name RC_NamesTable[] =
414 {
415 { rne, STRING_COMMA_LEN ("rn-sae") },
416 { rd, STRING_COMMA_LEN ("rd-sae") },
417 { ru, STRING_COMMA_LEN ("ru-sae") },
418 { rz, STRING_COMMA_LEN ("rz-sae") },
419 { saeonly, STRING_COMMA_LEN ("sae") },
420 };
421
422 /* List of chars besides those in app.c:symbol_chars that can start an
423 operand. Used to prevent the scrubber eating vital white-space. */
424 const char extra_symbol_chars[] = "*%-([{}"
425 #ifdef LEX_AT
426 "@"
427 #endif
428 #ifdef LEX_QM
429 "?"
430 #endif
431 ;
432
433 #if (defined (TE_I386AIX) \
434 || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
435 && !defined (TE_GNU) \
436 && !defined (TE_LINUX) \
437 && !defined (TE_NACL) \
438 && !defined (TE_FreeBSD) \
439 && !defined (TE_DragonFly) \
440 && !defined (TE_NetBSD)))
441 /* This array holds the chars that always start a comment. If the
442 pre-processor is disabled, these aren't very useful. The option
443 --divide will remove '/' from this list. */
444 const char *i386_comment_chars = "#/";
445 #define SVR4_COMMENT_CHARS 1
446 #define PREFIX_SEPARATOR '\\'
447
448 #else
449 const char *i386_comment_chars = "#";
450 #define PREFIX_SEPARATOR '/'
451 #endif
452
453 /* This array holds the chars that only start a comment at the beginning of
454 a line. If the line seems to have the form '# 123 filename'
455 .line and .file directives will appear in the pre-processed output.
456 Note that input_file.c hand checks for '#' at the beginning of the
457 first line of the input file. This is because the compiler outputs
458 #NO_APP at the beginning of its output.
459 Also note that comments started like this one will always work if
460 '/' isn't otherwise defined. */
461 const char line_comment_chars[] = "#/";
462
463 const char line_separator_chars[] = ";";
464
465 /* Chars that can be used to separate mant from exp in floating point
466 nums. */
467 const char EXP_CHARS[] = "eE";
468
469 /* Chars that mean this number is a floating point constant
470 As in 0f12.456
471 or 0d1.2345e12. */
472 const char FLT_CHARS[] = "fFdDxX";
473
474 /* Tables for lexical analysis. */
475 static char mnemonic_chars[256];
476 static char register_chars[256];
477 static char operand_chars[256];
478 static char identifier_chars[256];
479 static char digit_chars[256];
480
481 /* Lexical macros. */
482 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
483 #define is_operand_char(x) (operand_chars[(unsigned char) x])
484 #define is_register_char(x) (register_chars[(unsigned char) x])
485 #define is_space_char(x) ((x) == ' ')
486 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
487 #define is_digit_char(x) (digit_chars[(unsigned char) x])
488
489 /* All non-digit non-letter characters that may occur in an operand. */
490 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
491
492 /* md_assemble() always leaves the strings it's passed unaltered. To
493 effect this we maintain a stack of saved characters that we've smashed
494 with '\0's (indicating end of strings for various sub-fields of the
495 assembler instruction). */
496 static char save_stack[32];
497 static char *save_stack_p;
498 #define END_STRING_AND_SAVE(s) \
499 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
500 #define RESTORE_END_STRING(s) \
501 do { *(s) = *--save_stack_p; } while (0)
502
503 /* The instruction we're assembling. */
504 static i386_insn i;
505
506 /* Possible templates for current insn. */
507 static const templates *current_templates;
508
509 /* Per instruction expressionS buffers: max displacements & immediates. */
510 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
511 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
512
513 /* Current operand we are working on. */
514 static int this_operand = -1;
515
516 /* We support four different modes. FLAG_CODE variable is used to distinguish
517 these. */
518
519 enum flag_code {
520 CODE_32BIT,
521 CODE_16BIT,
522 CODE_64BIT };
523
524 static enum flag_code flag_code;
525 static unsigned int object_64bit;
526 static unsigned int disallow_64bit_reloc;
527 static int use_rela_relocations = 0;
528
529 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
530 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
531 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
532
533 /* The ELF ABI to use. */
534 enum x86_elf_abi
535 {
536 I386_ABI,
537 X86_64_ABI,
538 X86_64_X32_ABI
539 };
540
541 static enum x86_elf_abi x86_elf_abi = I386_ABI;
542 #endif
543
544 #if defined (TE_PE) || defined (TE_PEP)
545 /* Use big object file format. */
546 static int use_big_obj = 0;
547 #endif
548
549 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
550 /* 1 if generating code for a shared library. */
551 static int shared = 0;
552 #endif
553
554 /* 1 for intel syntax,
555 0 if att syntax. */
556 static int intel_syntax = 0;
557
558 /* 1 for Intel64 ISA,
559 0 if AMD64 ISA. */
560 static int intel64;
561
562 /* 1 for intel mnemonic,
563 0 if att mnemonic. */
564 static int intel_mnemonic = !SYSV386_COMPAT;
565
566 /* 1 if pseudo registers are permitted. */
567 static int allow_pseudo_reg = 0;
568
569 /* 1 if register prefix % not required. */
570 static int allow_naked_reg = 0;
571
572 /* 1 if the assembler should add BND prefix for all control-transferring
573 instructions supporting it, even if this prefix wasn't specified
574 explicitly. */
575 static int add_bnd_prefix = 0;
576
577 /* 1 if pseudo index register, eiz/riz, is allowed . */
578 static int allow_index_reg = 0;
579
580 /* 1 if the assembler should ignore LOCK prefix, even if it was
581 specified explicitly. */
582 static int omit_lock_prefix = 0;
583
584 /* 1 if the assembler should encode lfence, mfence, and sfence as
585 "lock addl $0, (%{re}sp)". */
586 static int avoid_fence = 0;
587
588 /* 1 if the assembler should generate relax relocations. */
589
590 static int generate_relax_relocations
591 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
592
593 static enum check_kind
594 {
595 check_none = 0,
596 check_warning,
597 check_error
598 }
599 sse_check, operand_check = check_warning;
600
601 /* Optimization:
602 1. Clear the REX_W bit with register operand if possible.
603 2. Above plus use 128bit vector instruction to clear the full vector
604 register.
605 */
606 static int optimize = 0;
607
608 /* Optimization:
609 1. Clear the REX_W bit with register operand if possible.
610 2. Above plus use 128bit vector instruction to clear the full vector
611 register.
612 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
613 "testb $imm7,%r8".
614 */
615 static int optimize_for_space = 0;
616
617 /* Register prefix used for error message. */
618 static const char *register_prefix = "%";
619
620 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
621 leave, push, and pop instructions so that gcc has the same stack
622 frame as in 32 bit mode. */
623 static char stackop_size = '\0';
624
625 /* Non-zero to optimize code alignment. */
626 int optimize_align_code = 1;
627
628 /* Non-zero to quieten some warnings. */
629 static int quiet_warnings = 0;
630
631 /* CPU name. */
632 static const char *cpu_arch_name = NULL;
633 static char *cpu_sub_arch_name = NULL;
634
635 /* CPU feature flags. */
636 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
637
638 /* If we have selected a cpu we are generating instructions for. */
639 static int cpu_arch_tune_set = 0;
640
641 /* Cpu we are generating instructions for. */
642 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
643
644 /* CPU feature flags of cpu we are generating instructions for. */
645 static i386_cpu_flags cpu_arch_tune_flags;
646
647 /* CPU instruction set architecture used. */
648 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
649
650 /* CPU feature flags of instruction set architecture used. */
651 i386_cpu_flags cpu_arch_isa_flags;
652
653 /* If set, conditional jumps are not automatically promoted to handle
654 larger than a byte offset. */
655 static unsigned int no_cond_jump_promotion = 0;
656
657 /* Encode SSE instructions with VEX prefix. */
658 static unsigned int sse2avx;
659
660 /* Encode scalar AVX instructions with specific vector length. */
661 static enum
662 {
663 vex128 = 0,
664 vex256
665 } avxscalar;
666
667 /* Encode scalar EVEX LIG instructions with specific vector length. */
668 static enum
669 {
670 evexl128 = 0,
671 evexl256,
672 evexl512
673 } evexlig;
674
675 /* Encode EVEX WIG instructions with specific evex.w. */
676 static enum
677 {
678 evexw0 = 0,
679 evexw1
680 } evexwig;
681
682 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
683 static enum rc_type evexrcig = rne;
684
685 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
686 static symbolS *GOT_symbol;
687
688 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
689 unsigned int x86_dwarf2_return_column;
690
691 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
692 int x86_cie_data_alignment;
693
694 /* Interface to relax_segment.
695 There are 3 major relax states for 386 jump insns because the
696 different types of jumps add different sizes to frags when we're
697 figuring out what sort of jump to choose to reach a given label. */
698
699 /* Types. */
700 #define UNCOND_JUMP 0
701 #define COND_JUMP 1
702 #define COND_JUMP86 2
703
704 /* Sizes. */
705 #define CODE16 1
706 #define SMALL 0
707 #define SMALL16 (SMALL | CODE16)
708 #define BIG 2
709 #define BIG16 (BIG | CODE16)
710
711 #ifndef INLINE
712 #ifdef __GNUC__
713 #define INLINE __inline__
714 #else
715 #define INLINE
716 #endif
717 #endif
718
719 #define ENCODE_RELAX_STATE(type, size) \
720 ((relax_substateT) (((type) << 2) | (size)))
721 #define TYPE_FROM_RELAX_STATE(s) \
722 ((s) >> 2)
723 #define DISP_SIZE_FROM_RELAX_STATE(s) \
724 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
725
726 /* This table is used by relax_frag to promote short jumps to long
727 ones where necessary. SMALL (short) jumps may be promoted to BIG
728 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
729 don't allow a short jump in a 32 bit code segment to be promoted to
730 a 16 bit offset jump because it's slower (requires data size
731 prefix), and doesn't work, unless the destination is in the bottom
732 64k of the code segment (The top 16 bits of eip are zeroed). */
733
734 const relax_typeS md_relax_table[] =
735 {
736 /* The fields are:
737 1) most positive reach of this state,
738 2) most negative reach of this state,
739 3) how many bytes this mode will have in the variable part of the frag
740 4) which index into the table to try if we can't fit into this one. */
741
742 /* UNCOND_JUMP states. */
743 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
744 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
745 /* dword jmp adds 4 bytes to frag:
746 0 extra opcode bytes, 4 displacement bytes. */
747 {0, 0, 4, 0},
748 /* word jmp adds 2 byte2 to frag:
749 0 extra opcode bytes, 2 displacement bytes. */
750 {0, 0, 2, 0},
751
752 /* COND_JUMP states. */
753 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
754 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
755 /* dword conditionals adds 5 bytes to frag:
756 1 extra opcode byte, 4 displacement bytes. */
757 {0, 0, 5, 0},
758 /* word conditionals add 3 bytes to frag:
759 1 extra opcode byte, 2 displacement bytes. */
760 {0, 0, 3, 0},
761
762 /* COND_JUMP86 states. */
763 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
764 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
765 /* dword conditionals adds 5 bytes to frag:
766 1 extra opcode byte, 4 displacement bytes. */
767 {0, 0, 5, 0},
768 /* word conditionals add 4 bytes to frag:
769 1 displacement byte and a 3 byte long branch insn. */
770 {0, 0, 4, 0}
771 };
772
773 static const arch_entry cpu_arch[] =
774 {
775 /* Do not replace the first two entries - i386_target_format()
776 relies on them being there in this order. */
777 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
778 CPU_GENERIC32_FLAGS, 0 },
779 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
780 CPU_GENERIC64_FLAGS, 0 },
781 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
782 CPU_NONE_FLAGS, 0 },
783 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
784 CPU_I186_FLAGS, 0 },
785 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
786 CPU_I286_FLAGS, 0 },
787 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
788 CPU_I386_FLAGS, 0 },
789 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
790 CPU_I486_FLAGS, 0 },
791 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
792 CPU_I586_FLAGS, 0 },
793 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
794 CPU_I686_FLAGS, 0 },
795 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
796 CPU_I586_FLAGS, 0 },
797 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
798 CPU_PENTIUMPRO_FLAGS, 0 },
799 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
800 CPU_P2_FLAGS, 0 },
801 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
802 CPU_P3_FLAGS, 0 },
803 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
804 CPU_P4_FLAGS, 0 },
805 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
806 CPU_CORE_FLAGS, 0 },
807 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
808 CPU_NOCONA_FLAGS, 0 },
809 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
810 CPU_CORE_FLAGS, 1 },
811 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
812 CPU_CORE_FLAGS, 0 },
813 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
814 CPU_CORE2_FLAGS, 1 },
815 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
816 CPU_CORE2_FLAGS, 0 },
817 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
818 CPU_COREI7_FLAGS, 0 },
819 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
820 CPU_L1OM_FLAGS, 0 },
821 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
822 CPU_K1OM_FLAGS, 0 },
823 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
824 CPU_IAMCU_FLAGS, 0 },
825 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
826 CPU_K6_FLAGS, 0 },
827 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
828 CPU_K6_2_FLAGS, 0 },
829 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
830 CPU_ATHLON_FLAGS, 0 },
831 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
832 CPU_K8_FLAGS, 1 },
833 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
834 CPU_K8_FLAGS, 0 },
835 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
836 CPU_K8_FLAGS, 0 },
837 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
838 CPU_AMDFAM10_FLAGS, 0 },
839 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
840 CPU_BDVER1_FLAGS, 0 },
841 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
842 CPU_BDVER2_FLAGS, 0 },
843 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
844 CPU_BDVER3_FLAGS, 0 },
845 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
846 CPU_BDVER4_FLAGS, 0 },
847 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
848 CPU_ZNVER1_FLAGS, 0 },
849 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
850 CPU_ZNVER2_FLAGS, 0 },
851 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
852 CPU_BTVER1_FLAGS, 0 },
853 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
854 CPU_BTVER2_FLAGS, 0 },
855 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
856 CPU_8087_FLAGS, 0 },
857 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
858 CPU_287_FLAGS, 0 },
859 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
860 CPU_387_FLAGS, 0 },
861 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
862 CPU_687_FLAGS, 0 },
863 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
864 CPU_CMOV_FLAGS, 0 },
865 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
866 CPU_FXSR_FLAGS, 0 },
867 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
868 CPU_MMX_FLAGS, 0 },
869 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
870 CPU_SSE_FLAGS, 0 },
871 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
872 CPU_SSE2_FLAGS, 0 },
873 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
874 CPU_SSE3_FLAGS, 0 },
875 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
876 CPU_SSSE3_FLAGS, 0 },
877 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
878 CPU_SSE4_1_FLAGS, 0 },
879 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
880 CPU_SSE4_2_FLAGS, 0 },
881 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
882 CPU_SSE4_2_FLAGS, 0 },
883 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
884 CPU_AVX_FLAGS, 0 },
885 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
886 CPU_AVX2_FLAGS, 0 },
887 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
888 CPU_AVX512F_FLAGS, 0 },
889 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
890 CPU_AVX512CD_FLAGS, 0 },
891 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
892 CPU_AVX512ER_FLAGS, 0 },
893 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
894 CPU_AVX512PF_FLAGS, 0 },
895 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
896 CPU_AVX512DQ_FLAGS, 0 },
897 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
898 CPU_AVX512BW_FLAGS, 0 },
899 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
900 CPU_AVX512VL_FLAGS, 0 },
901 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
902 CPU_VMX_FLAGS, 0 },
903 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
904 CPU_VMFUNC_FLAGS, 0 },
905 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
906 CPU_SMX_FLAGS, 0 },
907 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
908 CPU_XSAVE_FLAGS, 0 },
909 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
910 CPU_XSAVEOPT_FLAGS, 0 },
911 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
912 CPU_XSAVEC_FLAGS, 0 },
913 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
914 CPU_XSAVES_FLAGS, 0 },
915 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
916 CPU_AES_FLAGS, 0 },
917 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
918 CPU_PCLMUL_FLAGS, 0 },
919 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
920 CPU_PCLMUL_FLAGS, 1 },
921 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
922 CPU_FSGSBASE_FLAGS, 0 },
923 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
924 CPU_RDRND_FLAGS, 0 },
925 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
926 CPU_F16C_FLAGS, 0 },
927 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
928 CPU_BMI2_FLAGS, 0 },
929 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
930 CPU_FMA_FLAGS, 0 },
931 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
932 CPU_FMA4_FLAGS, 0 },
933 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
934 CPU_XOP_FLAGS, 0 },
935 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
936 CPU_LWP_FLAGS, 0 },
937 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
938 CPU_MOVBE_FLAGS, 0 },
939 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
940 CPU_CX16_FLAGS, 0 },
941 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
942 CPU_EPT_FLAGS, 0 },
943 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
944 CPU_LZCNT_FLAGS, 0 },
945 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
946 CPU_HLE_FLAGS, 0 },
947 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
948 CPU_RTM_FLAGS, 0 },
949 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
950 CPU_INVPCID_FLAGS, 0 },
951 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
952 CPU_CLFLUSH_FLAGS, 0 },
953 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
954 CPU_NOP_FLAGS, 0 },
955 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
956 CPU_SYSCALL_FLAGS, 0 },
957 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
958 CPU_RDTSCP_FLAGS, 0 },
959 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
960 CPU_3DNOW_FLAGS, 0 },
961 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
962 CPU_3DNOWA_FLAGS, 0 },
963 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
964 CPU_PADLOCK_FLAGS, 0 },
965 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
966 CPU_SVME_FLAGS, 1 },
967 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
968 CPU_SVME_FLAGS, 0 },
969 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
970 CPU_SSE4A_FLAGS, 0 },
971 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
972 CPU_ABM_FLAGS, 0 },
973 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
974 CPU_BMI_FLAGS, 0 },
975 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
976 CPU_TBM_FLAGS, 0 },
977 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
978 CPU_ADX_FLAGS, 0 },
979 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
980 CPU_RDSEED_FLAGS, 0 },
981 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
982 CPU_PRFCHW_FLAGS, 0 },
983 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
984 CPU_SMAP_FLAGS, 0 },
985 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
986 CPU_MPX_FLAGS, 0 },
987 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
988 CPU_SHA_FLAGS, 0 },
989 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
990 CPU_CLFLUSHOPT_FLAGS, 0 },
991 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
992 CPU_PREFETCHWT1_FLAGS, 0 },
993 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
994 CPU_SE1_FLAGS, 0 },
995 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
996 CPU_CLWB_FLAGS, 0 },
997 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
998 CPU_AVX512IFMA_FLAGS, 0 },
999 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1000 CPU_AVX512VBMI_FLAGS, 0 },
1001 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1002 CPU_AVX512_4FMAPS_FLAGS, 0 },
1003 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1004 CPU_AVX512_4VNNIW_FLAGS, 0 },
1005 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1006 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1007 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1008 CPU_AVX512_VBMI2_FLAGS, 0 },
1009 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1010 CPU_AVX512_VNNI_FLAGS, 0 },
1011 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1012 CPU_AVX512_BITALG_FLAGS, 0 },
1013 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1014 CPU_CLZERO_FLAGS, 0 },
1015 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1016 CPU_MWAITX_FLAGS, 0 },
1017 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1018 CPU_OSPKE_FLAGS, 0 },
1019 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1020 CPU_RDPID_FLAGS, 0 },
1021 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1022 CPU_PTWRITE_FLAGS, 0 },
1023 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1024 CPU_IBT_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1026 CPU_SHSTK_FLAGS, 0 },
1027 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1028 CPU_GFNI_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1030 CPU_VAES_FLAGS, 0 },
1031 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1032 CPU_VPCLMULQDQ_FLAGS, 0 },
1033 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1034 CPU_WBNOINVD_FLAGS, 0 },
1035 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1036 CPU_PCONFIG_FLAGS, 0 },
1037 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1038 CPU_WAITPKG_FLAGS, 0 },
1039 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1040 CPU_CLDEMOTE_FLAGS, 0 },
1041 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1042 CPU_MOVDIRI_FLAGS, 0 },
1043 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1044 CPU_MOVDIR64B_FLAGS, 0 },
1045 };
1046
1047 static const noarch_entry cpu_noarch[] =
1048 {
1049 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1050 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1051 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1052 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1053 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1054 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1055 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1056 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1057 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1058 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1059 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1060 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1061 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1062 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1063 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1064 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1065 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1066 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1067 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1068 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1069 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1070 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1071 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1072 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1073 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1074 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1075 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1076 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1077 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1078 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1079 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1080 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1081 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1082 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1083 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1084 };
1085
1086 #ifdef I386COFF
1087 /* Like s_lcomm_internal in gas/read.c but the alignment string
1088 is allowed to be optional. */
1089
1090 static symbolS *
1091 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1092 {
1093 addressT align = 0;
1094
1095 SKIP_WHITESPACE ();
1096
1097 if (needs_align
1098 && *input_line_pointer == ',')
1099 {
1100 align = parse_align (needs_align - 1);
1101
1102 if (align == (addressT) -1)
1103 return NULL;
1104 }
1105 else
1106 {
1107 if (size >= 8)
1108 align = 3;
1109 else if (size >= 4)
1110 align = 2;
1111 else if (size >= 2)
1112 align = 1;
1113 else
1114 align = 0;
1115 }
1116
1117 bss_alloc (symbolP, size, align);
1118 return symbolP;
1119 }
1120
1121 static void
1122 pe_lcomm (int needs_align)
1123 {
1124 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1125 }
1126 #endif
1127
1128 const pseudo_typeS md_pseudo_table[] =
1129 {
1130 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1131 {"align", s_align_bytes, 0},
1132 #else
1133 {"align", s_align_ptwo, 0},
1134 #endif
1135 {"arch", set_cpu_arch, 0},
1136 #ifndef I386COFF
1137 {"bss", s_bss, 0},
1138 #else
1139 {"lcomm", pe_lcomm, 1},
1140 #endif
1141 {"ffloat", float_cons, 'f'},
1142 {"dfloat", float_cons, 'd'},
1143 {"tfloat", float_cons, 'x'},
1144 {"value", cons, 2},
1145 {"slong", signed_cons, 4},
1146 {"noopt", s_ignore, 0},
1147 {"optim", s_ignore, 0},
1148 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1149 {"code16", set_code_flag, CODE_16BIT},
1150 {"code32", set_code_flag, CODE_32BIT},
1151 #ifdef BFD64
1152 {"code64", set_code_flag, CODE_64BIT},
1153 #endif
1154 {"intel_syntax", set_intel_syntax, 1},
1155 {"att_syntax", set_intel_syntax, 0},
1156 {"intel_mnemonic", set_intel_mnemonic, 1},
1157 {"att_mnemonic", set_intel_mnemonic, 0},
1158 {"allow_index_reg", set_allow_index_reg, 1},
1159 {"disallow_index_reg", set_allow_index_reg, 0},
1160 {"sse_check", set_check, 0},
1161 {"operand_check", set_check, 1},
1162 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1163 {"largecomm", handle_large_common, 0},
1164 #else
1165 {"file", dwarf2_directive_file, 0},
1166 {"loc", dwarf2_directive_loc, 0},
1167 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1168 #endif
1169 #ifdef TE_PE
1170 {"secrel32", pe_directive_secrel, 0},
1171 #endif
1172 {0, 0, 0}
1173 };
1174
1175 /* For interface with expression (). */
1176 extern char *input_line_pointer;
1177
1178 /* Hash table for instruction mnemonic lookup. */
1179 static struct hash_control *op_hash;
1180
1181 /* Hash table for register lookup. */
1182 static struct hash_control *reg_hash;
1183 \f
1184 /* Various efficient no-op patterns for aligning code labels.
1185 Note: Don't try to assemble the instructions in the comments.
1186 0L and 0w are not legal. */
1187 static const unsigned char f32_1[] =
1188 {0x90}; /* nop */
1189 static const unsigned char f32_2[] =
1190 {0x66,0x90}; /* xchg %ax,%ax */
1191 static const unsigned char f32_3[] =
1192 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1193 static const unsigned char f32_4[] =
1194 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1195 static const unsigned char f32_6[] =
1196 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1197 static const unsigned char f32_7[] =
1198 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1199 static const unsigned char f16_3[] =
1200 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1201 static const unsigned char f16_4[] =
1202 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1203 static const unsigned char jump_disp8[] =
1204 {0xeb}; /* jmp disp8 */
1205 static const unsigned char jump32_disp32[] =
1206 {0xe9}; /* jmp disp32 */
1207 static const unsigned char jump16_disp32[] =
1208 {0x66,0xe9}; /* jmp disp32 */
1209 /* 32-bit NOPs patterns. */
1210 static const unsigned char *const f32_patt[] = {
1211 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1212 };
1213 /* 16-bit NOPs patterns. */
1214 static const unsigned char *const f16_patt[] = {
1215 f32_1, f32_2, f16_3, f16_4
1216 };
1217 /* nopl (%[re]ax) */
1218 static const unsigned char alt_3[] =
1219 {0x0f,0x1f,0x00};
1220 /* nopl 0(%[re]ax) */
1221 static const unsigned char alt_4[] =
1222 {0x0f,0x1f,0x40,0x00};
1223 /* nopl 0(%[re]ax,%[re]ax,1) */
1224 static const unsigned char alt_5[] =
1225 {0x0f,0x1f,0x44,0x00,0x00};
1226 /* nopw 0(%[re]ax,%[re]ax,1) */
1227 static const unsigned char alt_6[] =
1228 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1229 /* nopl 0L(%[re]ax) */
1230 static const unsigned char alt_7[] =
1231 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1232 /* nopl 0L(%[re]ax,%[re]ax,1) */
1233 static const unsigned char alt_8[] =
1234 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1235 /* nopw 0L(%[re]ax,%[re]ax,1) */
1236 static const unsigned char alt_9[] =
1237 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1238 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1239 static const unsigned char alt_10[] =
1240 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1241 /* data16 nopw %cs:0L(%eax,%eax,1) */
1242 static const unsigned char alt_11[] =
1243 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1244 /* 32-bit and 64-bit NOPs patterns. */
1245 static const unsigned char *const alt_patt[] = {
1246 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1247 alt_9, alt_10, alt_11
1248 };
1249
1250 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1251 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1252
1253 static void
1254 i386_output_nops (char *where, const unsigned char *const *patt,
1255 int count, int max_single_nop_size)
1256
1257 {
1258 /* Place the longer NOP first. */
1259 int last;
1260 int offset;
1261 const unsigned char *nops = patt[max_single_nop_size - 1];
1262
1263 /* Use the smaller one if the requsted one isn't available. */
1264 if (nops == NULL)
1265 {
1266 max_single_nop_size--;
1267 nops = patt[max_single_nop_size - 1];
1268 }
1269
1270 last = count % max_single_nop_size;
1271
1272 count -= last;
1273 for (offset = 0; offset < count; offset += max_single_nop_size)
1274 memcpy (where + offset, nops, max_single_nop_size);
1275
1276 if (last)
1277 {
1278 nops = patt[last - 1];
1279 if (nops == NULL)
1280 {
1281 /* Use the smaller one plus one-byte NOP if the needed one
1282 isn't available. */
1283 last--;
1284 nops = patt[last - 1];
1285 memcpy (where + offset, nops, last);
1286 where[offset + last] = *patt[0];
1287 }
1288 else
1289 memcpy (where + offset, nops, last);
1290 }
1291 }
1292
1293 static INLINE int
1294 fits_in_imm7 (offsetT num)
1295 {
1296 return (num & 0x7f) == num;
1297 }
1298
1299 static INLINE int
1300 fits_in_imm31 (offsetT num)
1301 {
1302 return (num & 0x7fffffff) == num;
1303 }
1304
1305 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1306 single NOP instruction LIMIT. */
1307
1308 void
1309 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1310 {
1311 const unsigned char *const *patt = NULL;
1312 int max_single_nop_size;
1313 /* Maximum number of NOPs before switching to jump over NOPs. */
1314 int max_number_of_nops;
1315
1316 switch (fragP->fr_type)
1317 {
1318 case rs_fill_nop:
1319 case rs_align_code:
1320 break;
1321 default:
1322 return;
1323 }
1324
1325 /* We need to decide which NOP sequence to use for 32bit and
1326 64bit. When -mtune= is used:
1327
1328 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1329 PROCESSOR_GENERIC32, f32_patt will be used.
1330 2. For the rest, alt_patt will be used.
1331
1332 When -mtune= isn't used, alt_patt will be used if
1333 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1334 be used.
1335
1336 When -march= or .arch is used, we can't use anything beyond
1337 cpu_arch_isa_flags. */
1338
1339 if (flag_code == CODE_16BIT)
1340 {
1341 patt = f16_patt;
1342 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1343 /* Limit number of NOPs to 2 in 16-bit mode. */
1344 max_number_of_nops = 2;
1345 }
1346 else
1347 {
1348 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1349 {
1350 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1351 switch (cpu_arch_tune)
1352 {
1353 case PROCESSOR_UNKNOWN:
1354 /* We use cpu_arch_isa_flags to check if we SHOULD
1355 optimize with nops. */
1356 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1357 patt = alt_patt;
1358 else
1359 patt = f32_patt;
1360 break;
1361 case PROCESSOR_PENTIUM4:
1362 case PROCESSOR_NOCONA:
1363 case PROCESSOR_CORE:
1364 case PROCESSOR_CORE2:
1365 case PROCESSOR_COREI7:
1366 case PROCESSOR_L1OM:
1367 case PROCESSOR_K1OM:
1368 case PROCESSOR_GENERIC64:
1369 case PROCESSOR_K6:
1370 case PROCESSOR_ATHLON:
1371 case PROCESSOR_K8:
1372 case PROCESSOR_AMDFAM10:
1373 case PROCESSOR_BD:
1374 case PROCESSOR_ZNVER:
1375 case PROCESSOR_BT:
1376 patt = alt_patt;
1377 break;
1378 case PROCESSOR_I386:
1379 case PROCESSOR_I486:
1380 case PROCESSOR_PENTIUM:
1381 case PROCESSOR_PENTIUMPRO:
1382 case PROCESSOR_IAMCU:
1383 case PROCESSOR_GENERIC32:
1384 patt = f32_patt;
1385 break;
1386 }
1387 }
1388 else
1389 {
1390 switch (fragP->tc_frag_data.tune)
1391 {
1392 case PROCESSOR_UNKNOWN:
1393 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1394 PROCESSOR_UNKNOWN. */
1395 abort ();
1396 break;
1397
1398 case PROCESSOR_I386:
1399 case PROCESSOR_I486:
1400 case PROCESSOR_PENTIUM:
1401 case PROCESSOR_IAMCU:
1402 case PROCESSOR_K6:
1403 case PROCESSOR_ATHLON:
1404 case PROCESSOR_K8:
1405 case PROCESSOR_AMDFAM10:
1406 case PROCESSOR_BD:
1407 case PROCESSOR_ZNVER:
1408 case PROCESSOR_BT:
1409 case PROCESSOR_GENERIC32:
1410 /* We use cpu_arch_isa_flags to check if we CAN optimize
1411 with nops. */
1412 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1413 patt = alt_patt;
1414 else
1415 patt = f32_patt;
1416 break;
1417 case PROCESSOR_PENTIUMPRO:
1418 case PROCESSOR_PENTIUM4:
1419 case PROCESSOR_NOCONA:
1420 case PROCESSOR_CORE:
1421 case PROCESSOR_CORE2:
1422 case PROCESSOR_COREI7:
1423 case PROCESSOR_L1OM:
1424 case PROCESSOR_K1OM:
1425 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1426 patt = alt_patt;
1427 else
1428 patt = f32_patt;
1429 break;
1430 case PROCESSOR_GENERIC64:
1431 patt = alt_patt;
1432 break;
1433 }
1434 }
1435
1436 if (patt == f32_patt)
1437 {
1438 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1439 /* Limit number of NOPs to 2 for older processors. */
1440 max_number_of_nops = 2;
1441 }
1442 else
1443 {
1444 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1445 /* Limit number of NOPs to 7 for newer processors. */
1446 max_number_of_nops = 7;
1447 }
1448 }
1449
1450 if (limit == 0)
1451 limit = max_single_nop_size;
1452
1453 if (fragP->fr_type == rs_fill_nop)
1454 {
1455 /* Output NOPs for .nop directive. */
1456 if (limit > max_single_nop_size)
1457 {
1458 as_bad_where (fragP->fr_file, fragP->fr_line,
1459 _("invalid single nop size: %d "
1460 "(expect within [0, %d])"),
1461 limit, max_single_nop_size);
1462 return;
1463 }
1464 }
1465 else
1466 fragP->fr_var = count;
1467
1468 if ((count / max_single_nop_size) > max_number_of_nops)
1469 {
1470 /* Generate jump over NOPs. */
1471 offsetT disp = count - 2;
1472 if (fits_in_imm7 (disp))
1473 {
1474 /* Use "jmp disp8" if possible. */
1475 count = disp;
1476 where[0] = jump_disp8[0];
1477 where[1] = count;
1478 where += 2;
1479 }
1480 else
1481 {
1482 unsigned int size_of_jump;
1483
1484 if (flag_code == CODE_16BIT)
1485 {
1486 where[0] = jump16_disp32[0];
1487 where[1] = jump16_disp32[1];
1488 size_of_jump = 2;
1489 }
1490 else
1491 {
1492 where[0] = jump32_disp32[0];
1493 size_of_jump = 1;
1494 }
1495
1496 count -= size_of_jump + 4;
1497 if (!fits_in_imm31 (count))
1498 {
1499 as_bad_where (fragP->fr_file, fragP->fr_line,
1500 _("jump over nop padding out of range"));
1501 return;
1502 }
1503
1504 md_number_to_chars (where + size_of_jump, count, 4);
1505 where += size_of_jump + 4;
1506 }
1507 }
1508
1509 /* Generate multiple NOPs. */
1510 i386_output_nops (where, patt, count, limit);
1511 }
1512
1513 static INLINE int
1514 operand_type_all_zero (const union i386_operand_type *x)
1515 {
1516 switch (ARRAY_SIZE(x->array))
1517 {
1518 case 3:
1519 if (x->array[2])
1520 return 0;
1521 /* Fall through. */
1522 case 2:
1523 if (x->array[1])
1524 return 0;
1525 /* Fall through. */
1526 case 1:
1527 return !x->array[0];
1528 default:
1529 abort ();
1530 }
1531 }
1532
1533 static INLINE void
1534 operand_type_set (union i386_operand_type *x, unsigned int v)
1535 {
1536 switch (ARRAY_SIZE(x->array))
1537 {
1538 case 3:
1539 x->array[2] = v;
1540 /* Fall through. */
1541 case 2:
1542 x->array[1] = v;
1543 /* Fall through. */
1544 case 1:
1545 x->array[0] = v;
1546 /* Fall through. */
1547 break;
1548 default:
1549 abort ();
1550 }
1551 }
1552
1553 static INLINE int
1554 operand_type_equal (const union i386_operand_type *x,
1555 const union i386_operand_type *y)
1556 {
1557 switch (ARRAY_SIZE(x->array))
1558 {
1559 case 3:
1560 if (x->array[2] != y->array[2])
1561 return 0;
1562 /* Fall through. */
1563 case 2:
1564 if (x->array[1] != y->array[1])
1565 return 0;
1566 /* Fall through. */
1567 case 1:
1568 return x->array[0] == y->array[0];
1569 break;
1570 default:
1571 abort ();
1572 }
1573 }
1574
1575 static INLINE int
1576 cpu_flags_all_zero (const union i386_cpu_flags *x)
1577 {
1578 switch (ARRAY_SIZE(x->array))
1579 {
1580 case 4:
1581 if (x->array[3])
1582 return 0;
1583 /* Fall through. */
1584 case 3:
1585 if (x->array[2])
1586 return 0;
1587 /* Fall through. */
1588 case 2:
1589 if (x->array[1])
1590 return 0;
1591 /* Fall through. */
1592 case 1:
1593 return !x->array[0];
1594 default:
1595 abort ();
1596 }
1597 }
1598
1599 static INLINE int
1600 cpu_flags_equal (const union i386_cpu_flags *x,
1601 const union i386_cpu_flags *y)
1602 {
1603 switch (ARRAY_SIZE(x->array))
1604 {
1605 case 4:
1606 if (x->array[3] != y->array[3])
1607 return 0;
1608 /* Fall through. */
1609 case 3:
1610 if (x->array[2] != y->array[2])
1611 return 0;
1612 /* Fall through. */
1613 case 2:
1614 if (x->array[1] != y->array[1])
1615 return 0;
1616 /* Fall through. */
1617 case 1:
1618 return x->array[0] == y->array[0];
1619 break;
1620 default:
1621 abort ();
1622 }
1623 }
1624
1625 static INLINE int
1626 cpu_flags_check_cpu64 (i386_cpu_flags f)
1627 {
1628 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1629 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1630 }
1631
1632 static INLINE i386_cpu_flags
1633 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1634 {
1635 switch (ARRAY_SIZE (x.array))
1636 {
1637 case 4:
1638 x.array [3] &= y.array [3];
1639 /* Fall through. */
1640 case 3:
1641 x.array [2] &= y.array [2];
1642 /* Fall through. */
1643 case 2:
1644 x.array [1] &= y.array [1];
1645 /* Fall through. */
1646 case 1:
1647 x.array [0] &= y.array [0];
1648 break;
1649 default:
1650 abort ();
1651 }
1652 return x;
1653 }
1654
1655 static INLINE i386_cpu_flags
1656 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1657 {
1658 switch (ARRAY_SIZE (x.array))
1659 {
1660 case 4:
1661 x.array [3] |= y.array [3];
1662 /* Fall through. */
1663 case 3:
1664 x.array [2] |= y.array [2];
1665 /* Fall through. */
1666 case 2:
1667 x.array [1] |= y.array [1];
1668 /* Fall through. */
1669 case 1:
1670 x.array [0] |= y.array [0];
1671 break;
1672 default:
1673 abort ();
1674 }
1675 return x;
1676 }
1677
1678 static INLINE i386_cpu_flags
1679 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1680 {
1681 switch (ARRAY_SIZE (x.array))
1682 {
1683 case 4:
1684 x.array [3] &= ~y.array [3];
1685 /* Fall through. */
1686 case 3:
1687 x.array [2] &= ~y.array [2];
1688 /* Fall through. */
1689 case 2:
1690 x.array [1] &= ~y.array [1];
1691 /* Fall through. */
1692 case 1:
1693 x.array [0] &= ~y.array [0];
1694 break;
1695 default:
1696 abort ();
1697 }
1698 return x;
1699 }
1700
1701 #define CPU_FLAGS_ARCH_MATCH 0x1
1702 #define CPU_FLAGS_64BIT_MATCH 0x2
1703
1704 #define CPU_FLAGS_PERFECT_MATCH \
1705 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1706
1707 /* Return CPU flags match bits. */
1708
1709 static int
1710 cpu_flags_match (const insn_template *t)
1711 {
1712 i386_cpu_flags x = t->cpu_flags;
1713 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1714
1715 x.bitfield.cpu64 = 0;
1716 x.bitfield.cpuno64 = 0;
1717
1718 if (cpu_flags_all_zero (&x))
1719 {
1720 /* This instruction is available on all archs. */
1721 match |= CPU_FLAGS_ARCH_MATCH;
1722 }
1723 else
1724 {
1725 /* This instruction is available only on some archs. */
1726 i386_cpu_flags cpu = cpu_arch_flags;
1727
1728 /* AVX512VL is no standalone feature - match it and then strip it. */
1729 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1730 return match;
1731 x.bitfield.cpuavx512vl = 0;
1732
1733 cpu = cpu_flags_and (x, cpu);
1734 if (!cpu_flags_all_zero (&cpu))
1735 {
1736 if (x.bitfield.cpuavx)
1737 {
1738 /* We need to check a few extra flags with AVX. */
1739 if (cpu.bitfield.cpuavx
1740 && (!t->opcode_modifier.sse2avx || sse2avx)
1741 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1742 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1743 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1744 match |= CPU_FLAGS_ARCH_MATCH;
1745 }
1746 else if (x.bitfield.cpuavx512f)
1747 {
1748 /* We need to check a few extra flags with AVX512F. */
1749 if (cpu.bitfield.cpuavx512f
1750 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1751 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1752 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1753 match |= CPU_FLAGS_ARCH_MATCH;
1754 }
1755 else
1756 match |= CPU_FLAGS_ARCH_MATCH;
1757 }
1758 }
1759 return match;
1760 }
1761
1762 static INLINE i386_operand_type
1763 operand_type_and (i386_operand_type x, i386_operand_type y)
1764 {
1765 switch (ARRAY_SIZE (x.array))
1766 {
1767 case 3:
1768 x.array [2] &= y.array [2];
1769 /* Fall through. */
1770 case 2:
1771 x.array [1] &= y.array [1];
1772 /* Fall through. */
1773 case 1:
1774 x.array [0] &= y.array [0];
1775 break;
1776 default:
1777 abort ();
1778 }
1779 return x;
1780 }
1781
1782 static INLINE i386_operand_type
1783 operand_type_and_not (i386_operand_type x, i386_operand_type y)
1784 {
1785 switch (ARRAY_SIZE (x.array))
1786 {
1787 case 3:
1788 x.array [2] &= ~y.array [2];
1789 /* Fall through. */
1790 case 2:
1791 x.array [1] &= ~y.array [1];
1792 /* Fall through. */
1793 case 1:
1794 x.array [0] &= ~y.array [0];
1795 break;
1796 default:
1797 abort ();
1798 }
1799 return x;
1800 }
1801
1802 static INLINE i386_operand_type
1803 operand_type_or (i386_operand_type x, i386_operand_type y)
1804 {
1805 switch (ARRAY_SIZE (x.array))
1806 {
1807 case 3:
1808 x.array [2] |= y.array [2];
1809 /* Fall through. */
1810 case 2:
1811 x.array [1] |= y.array [1];
1812 /* Fall through. */
1813 case 1:
1814 x.array [0] |= y.array [0];
1815 break;
1816 default:
1817 abort ();
1818 }
1819 return x;
1820 }
1821
1822 static INLINE i386_operand_type
1823 operand_type_xor (i386_operand_type x, i386_operand_type y)
1824 {
1825 switch (ARRAY_SIZE (x.array))
1826 {
1827 case 3:
1828 x.array [2] ^= y.array [2];
1829 /* Fall through. */
1830 case 2:
1831 x.array [1] ^= y.array [1];
1832 /* Fall through. */
1833 case 1:
1834 x.array [0] ^= y.array [0];
1835 break;
1836 default:
1837 abort ();
1838 }
1839 return x;
1840 }
1841
1842 static const i386_operand_type acc32 = OPERAND_TYPE_ACC32;
1843 static const i386_operand_type acc64 = OPERAND_TYPE_ACC64;
1844 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1845 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1846 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1847 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1848 static const i386_operand_type anydisp
1849 = OPERAND_TYPE_ANYDISP;
1850 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1851 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1852 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1853 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1854 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1855 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1856 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1857 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1858 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1859 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1860 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1861 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
1862
1863 enum operand_type
1864 {
1865 reg,
1866 imm,
1867 disp,
1868 anymem
1869 };
1870
1871 static INLINE int
1872 operand_type_check (i386_operand_type t, enum operand_type c)
1873 {
1874 switch (c)
1875 {
1876 case reg:
1877 return t.bitfield.reg;
1878
1879 case imm:
1880 return (t.bitfield.imm8
1881 || t.bitfield.imm8s
1882 || t.bitfield.imm16
1883 || t.bitfield.imm32
1884 || t.bitfield.imm32s
1885 || t.bitfield.imm64);
1886
1887 case disp:
1888 return (t.bitfield.disp8
1889 || t.bitfield.disp16
1890 || t.bitfield.disp32
1891 || t.bitfield.disp32s
1892 || t.bitfield.disp64);
1893
1894 case anymem:
1895 return (t.bitfield.disp8
1896 || t.bitfield.disp16
1897 || t.bitfield.disp32
1898 || t.bitfield.disp32s
1899 || t.bitfield.disp64
1900 || t.bitfield.baseindex);
1901
1902 default:
1903 abort ();
1904 }
1905
1906 return 0;
1907 }
1908
1909 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
1910 between operand GIVEN and opeand WANTED for instruction template T. */
1911
1912 static INLINE int
1913 match_operand_size (const insn_template *t, unsigned int wanted,
1914 unsigned int given)
1915 {
1916 return !((i.types[given].bitfield.byte
1917 && !t->operand_types[wanted].bitfield.byte)
1918 || (i.types[given].bitfield.word
1919 && !t->operand_types[wanted].bitfield.word)
1920 || (i.types[given].bitfield.dword
1921 && !t->operand_types[wanted].bitfield.dword)
1922 || (i.types[given].bitfield.qword
1923 && !t->operand_types[wanted].bitfield.qword)
1924 || (i.types[given].bitfield.tbyte
1925 && !t->operand_types[wanted].bitfield.tbyte));
1926 }
1927
1928 /* Return 1 if there is no conflict in SIMD register between operand
1929 GIVEN and opeand WANTED for instruction template T. */
1930
1931 static INLINE int
1932 match_simd_size (const insn_template *t, unsigned int wanted,
1933 unsigned int given)
1934 {
1935 return !((i.types[given].bitfield.xmmword
1936 && !t->operand_types[wanted].bitfield.xmmword)
1937 || (i.types[given].bitfield.ymmword
1938 && !t->operand_types[wanted].bitfield.ymmword)
1939 || (i.types[given].bitfield.zmmword
1940 && !t->operand_types[wanted].bitfield.zmmword));
1941 }
1942
1943 /* Return 1 if there is no conflict in any size between operand GIVEN
1944 and opeand WANTED for instruction template T. */
1945
1946 static INLINE int
1947 match_mem_size (const insn_template *t, unsigned int wanted,
1948 unsigned int given)
1949 {
1950 return (match_operand_size (t, wanted, given)
1951 && !((i.types[given].bitfield.unspecified
1952 && !i.broadcast
1953 && !t->operand_types[wanted].bitfield.unspecified)
1954 || (i.types[given].bitfield.fword
1955 && !t->operand_types[wanted].bitfield.fword)
1956 /* For scalar opcode templates to allow register and memory
1957 operands at the same time, some special casing is needed
1958 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
1959 down-conversion vpmov*. */
1960 || ((t->operand_types[wanted].bitfield.regsimd
1961 && !t->opcode_modifier.broadcast
1962 && (t->operand_types[wanted].bitfield.byte
1963 || t->operand_types[wanted].bitfield.word
1964 || t->operand_types[wanted].bitfield.dword
1965 || t->operand_types[wanted].bitfield.qword))
1966 ? (i.types[given].bitfield.xmmword
1967 || i.types[given].bitfield.ymmword
1968 || i.types[given].bitfield.zmmword)
1969 : !match_simd_size(t, wanted, given))));
1970 }
1971
1972 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
1973 operands for instruction template T, and it has MATCH_REVERSE set if there
1974 is no size conflict on any operands for the template with operands reversed
1975 (and the template allows for reversing in the first place). */
1976
1977 #define MATCH_STRAIGHT 1
1978 #define MATCH_REVERSE 2
1979
1980 static INLINE unsigned int
1981 operand_size_match (const insn_template *t)
1982 {
1983 unsigned int j, match = MATCH_STRAIGHT;
1984
1985 /* Don't check jump instructions. */
1986 if (t->opcode_modifier.jump
1987 || t->opcode_modifier.jumpbyte
1988 || t->opcode_modifier.jumpdword
1989 || t->opcode_modifier.jumpintersegment)
1990 return match;
1991
1992 /* Check memory and accumulator operand size. */
1993 for (j = 0; j < i.operands; j++)
1994 {
1995 if (!i.types[j].bitfield.reg && !i.types[j].bitfield.regsimd
1996 && t->operand_types[j].bitfield.anysize)
1997 continue;
1998
1999 if (t->operand_types[j].bitfield.reg
2000 && !match_operand_size (t, j, j))
2001 {
2002 match = 0;
2003 break;
2004 }
2005
2006 if (t->operand_types[j].bitfield.regsimd
2007 && !match_simd_size (t, j, j))
2008 {
2009 match = 0;
2010 break;
2011 }
2012
2013 if (t->operand_types[j].bitfield.acc
2014 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2015 {
2016 match = 0;
2017 break;
2018 }
2019
2020 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2021 {
2022 match = 0;
2023 break;
2024 }
2025 }
2026
2027 if (!t->opcode_modifier.d)
2028 {
2029 mismatch:
2030 if (!match)
2031 i.error = operand_size_mismatch;
2032 return match;
2033 }
2034
2035 /* Check reverse. */
2036 gas_assert (i.operands == 2);
2037
2038 for (j = 0; j < 2; j++)
2039 {
2040 if ((t->operand_types[j].bitfield.reg
2041 || t->operand_types[j].bitfield.acc)
2042 && !match_operand_size (t, j, !j))
2043 goto mismatch;
2044
2045 if ((i.flags[!j] & Operand_Mem) && !match_mem_size (t, j, !j))
2046 goto mismatch;
2047 }
2048
2049 return match | MATCH_REVERSE;
2050 }
2051
2052 static INLINE int
2053 operand_type_match (i386_operand_type overlap,
2054 i386_operand_type given)
2055 {
2056 i386_operand_type temp = overlap;
2057
2058 temp.bitfield.jumpabsolute = 0;
2059 temp.bitfield.unspecified = 0;
2060 temp.bitfield.byte = 0;
2061 temp.bitfield.word = 0;
2062 temp.bitfield.dword = 0;
2063 temp.bitfield.fword = 0;
2064 temp.bitfield.qword = 0;
2065 temp.bitfield.tbyte = 0;
2066 temp.bitfield.xmmword = 0;
2067 temp.bitfield.ymmword = 0;
2068 temp.bitfield.zmmword = 0;
2069 if (operand_type_all_zero (&temp))
2070 goto mismatch;
2071
2072 if (given.bitfield.baseindex == overlap.bitfield.baseindex
2073 && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
2074 return 1;
2075
2076 mismatch:
2077 i.error = operand_type_mismatch;
2078 return 0;
2079 }
2080
2081 /* If given types g0 and g1 are registers they must be of the same type
2082 unless the expected operand type register overlap is null.
2083 Memory operand size of certain SIMD instructions is also being checked
2084 here. */
2085
2086 static INLINE int
2087 operand_type_register_match (i386_operand_type g0,
2088 i386_operand_type t0,
2089 i386_operand_type g1,
2090 i386_operand_type t1)
2091 {
2092 if (!g0.bitfield.reg
2093 && !g0.bitfield.regsimd
2094 && (!operand_type_check (g0, anymem)
2095 || g0.bitfield.unspecified
2096 || !t0.bitfield.regsimd))
2097 return 1;
2098
2099 if (!g1.bitfield.reg
2100 && !g1.bitfield.regsimd
2101 && (!operand_type_check (g1, anymem)
2102 || g1.bitfield.unspecified
2103 || !t1.bitfield.regsimd))
2104 return 1;
2105
2106 if (g0.bitfield.byte == g1.bitfield.byte
2107 && g0.bitfield.word == g1.bitfield.word
2108 && g0.bitfield.dword == g1.bitfield.dword
2109 && g0.bitfield.qword == g1.bitfield.qword
2110 && g0.bitfield.xmmword == g1.bitfield.xmmword
2111 && g0.bitfield.ymmword == g1.bitfield.ymmword
2112 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2113 return 1;
2114
2115 if (!(t0.bitfield.byte & t1.bitfield.byte)
2116 && !(t0.bitfield.word & t1.bitfield.word)
2117 && !(t0.bitfield.dword & t1.bitfield.dword)
2118 && !(t0.bitfield.qword & t1.bitfield.qword)
2119 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2120 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2121 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2122 return 1;
2123
2124 i.error = register_type_mismatch;
2125
2126 return 0;
2127 }
2128
2129 static INLINE unsigned int
2130 register_number (const reg_entry *r)
2131 {
2132 unsigned int nr = r->reg_num;
2133
2134 if (r->reg_flags & RegRex)
2135 nr += 8;
2136
2137 if (r->reg_flags & RegVRex)
2138 nr += 16;
2139
2140 return nr;
2141 }
2142
2143 static INLINE unsigned int
2144 mode_from_disp_size (i386_operand_type t)
2145 {
2146 if (t.bitfield.disp8)
2147 return 1;
2148 else if (t.bitfield.disp16
2149 || t.bitfield.disp32
2150 || t.bitfield.disp32s)
2151 return 2;
2152 else
2153 return 0;
2154 }
2155
2156 static INLINE int
2157 fits_in_signed_byte (addressT num)
2158 {
2159 return num + 0x80 <= 0xff;
2160 }
2161
2162 static INLINE int
2163 fits_in_unsigned_byte (addressT num)
2164 {
2165 return num <= 0xff;
2166 }
2167
2168 static INLINE int
2169 fits_in_unsigned_word (addressT num)
2170 {
2171 return num <= 0xffff;
2172 }
2173
2174 static INLINE int
2175 fits_in_signed_word (addressT num)
2176 {
2177 return num + 0x8000 <= 0xffff;
2178 }
2179
2180 static INLINE int
2181 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2182 {
2183 #ifndef BFD64
2184 return 1;
2185 #else
2186 return num + 0x80000000 <= 0xffffffff;
2187 #endif
2188 } /* fits_in_signed_long() */
2189
2190 static INLINE int
2191 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2192 {
2193 #ifndef BFD64
2194 return 1;
2195 #else
2196 return num <= 0xffffffff;
2197 #endif
2198 } /* fits_in_unsigned_long() */
2199
2200 static INLINE int
2201 fits_in_disp8 (offsetT num)
2202 {
2203 int shift = i.memshift;
2204 unsigned int mask;
2205
2206 if (shift == -1)
2207 abort ();
2208
2209 mask = (1 << shift) - 1;
2210
2211 /* Return 0 if NUM isn't properly aligned. */
2212 if ((num & mask))
2213 return 0;
2214
2215 /* Check if NUM will fit in 8bit after shift. */
2216 return fits_in_signed_byte (num >> shift);
2217 }
2218
2219 static INLINE int
2220 fits_in_imm4 (offsetT num)
2221 {
2222 return (num & 0xf) == num;
2223 }
2224
2225 static i386_operand_type
2226 smallest_imm_type (offsetT num)
2227 {
2228 i386_operand_type t;
2229
2230 operand_type_set (&t, 0);
2231 t.bitfield.imm64 = 1;
2232
2233 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2234 {
2235 /* This code is disabled on the 486 because all the Imm1 forms
2236 in the opcode table are slower on the i486. They're the
2237 versions with the implicitly specified single-position
2238 displacement, which has another syntax if you really want to
2239 use that form. */
2240 t.bitfield.imm1 = 1;
2241 t.bitfield.imm8 = 1;
2242 t.bitfield.imm8s = 1;
2243 t.bitfield.imm16 = 1;
2244 t.bitfield.imm32 = 1;
2245 t.bitfield.imm32s = 1;
2246 }
2247 else if (fits_in_signed_byte (num))
2248 {
2249 t.bitfield.imm8 = 1;
2250 t.bitfield.imm8s = 1;
2251 t.bitfield.imm16 = 1;
2252 t.bitfield.imm32 = 1;
2253 t.bitfield.imm32s = 1;
2254 }
2255 else if (fits_in_unsigned_byte (num))
2256 {
2257 t.bitfield.imm8 = 1;
2258 t.bitfield.imm16 = 1;
2259 t.bitfield.imm32 = 1;
2260 t.bitfield.imm32s = 1;
2261 }
2262 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2263 {
2264 t.bitfield.imm16 = 1;
2265 t.bitfield.imm32 = 1;
2266 t.bitfield.imm32s = 1;
2267 }
2268 else if (fits_in_signed_long (num))
2269 {
2270 t.bitfield.imm32 = 1;
2271 t.bitfield.imm32s = 1;
2272 }
2273 else if (fits_in_unsigned_long (num))
2274 t.bitfield.imm32 = 1;
2275
2276 return t;
2277 }
2278
2279 static offsetT
2280 offset_in_range (offsetT val, int size)
2281 {
2282 addressT mask;
2283
2284 switch (size)
2285 {
2286 case 1: mask = ((addressT) 1 << 8) - 1; break;
2287 case 2: mask = ((addressT) 1 << 16) - 1; break;
2288 case 4: mask = ((addressT) 2 << 31) - 1; break;
2289 #ifdef BFD64
2290 case 8: mask = ((addressT) 2 << 63) - 1; break;
2291 #endif
2292 default: abort ();
2293 }
2294
2295 #ifdef BFD64
2296 /* If BFD64, sign extend val for 32bit address mode. */
2297 if (flag_code != CODE_64BIT
2298 || i.prefix[ADDR_PREFIX])
2299 if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2300 val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2301 #endif
2302
2303 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2304 {
2305 char buf1[40], buf2[40];
2306
2307 sprint_value (buf1, val);
2308 sprint_value (buf2, val & mask);
2309 as_warn (_("%s shortened to %s"), buf1, buf2);
2310 }
2311 return val & mask;
2312 }
2313
2314 enum PREFIX_GROUP
2315 {
2316 PREFIX_EXIST = 0,
2317 PREFIX_LOCK,
2318 PREFIX_REP,
2319 PREFIX_DS,
2320 PREFIX_OTHER
2321 };
2322
2323 /* Returns
2324 a. PREFIX_EXIST if attempting to add a prefix where one from the
2325 same class already exists.
2326 b. PREFIX_LOCK if lock prefix is added.
2327 c. PREFIX_REP if rep/repne prefix is added.
2328 d. PREFIX_DS if ds prefix is added.
2329 e. PREFIX_OTHER if other prefix is added.
2330 */
2331
2332 static enum PREFIX_GROUP
2333 add_prefix (unsigned int prefix)
2334 {
2335 enum PREFIX_GROUP ret = PREFIX_OTHER;
2336 unsigned int q;
2337
2338 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2339 && flag_code == CODE_64BIT)
2340 {
2341 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2342 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2343 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2344 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2345 ret = PREFIX_EXIST;
2346 q = REX_PREFIX;
2347 }
2348 else
2349 {
2350 switch (prefix)
2351 {
2352 default:
2353 abort ();
2354
2355 case DS_PREFIX_OPCODE:
2356 ret = PREFIX_DS;
2357 /* Fall through. */
2358 case CS_PREFIX_OPCODE:
2359 case ES_PREFIX_OPCODE:
2360 case FS_PREFIX_OPCODE:
2361 case GS_PREFIX_OPCODE:
2362 case SS_PREFIX_OPCODE:
2363 q = SEG_PREFIX;
2364 break;
2365
2366 case REPNE_PREFIX_OPCODE:
2367 case REPE_PREFIX_OPCODE:
2368 q = REP_PREFIX;
2369 ret = PREFIX_REP;
2370 break;
2371
2372 case LOCK_PREFIX_OPCODE:
2373 q = LOCK_PREFIX;
2374 ret = PREFIX_LOCK;
2375 break;
2376
2377 case FWAIT_OPCODE:
2378 q = WAIT_PREFIX;
2379 break;
2380
2381 case ADDR_PREFIX_OPCODE:
2382 q = ADDR_PREFIX;
2383 break;
2384
2385 case DATA_PREFIX_OPCODE:
2386 q = DATA_PREFIX;
2387 break;
2388 }
2389 if (i.prefix[q] != 0)
2390 ret = PREFIX_EXIST;
2391 }
2392
2393 if (ret)
2394 {
2395 if (!i.prefix[q])
2396 ++i.prefixes;
2397 i.prefix[q] |= prefix;
2398 }
2399 else
2400 as_bad (_("same type of prefix used twice"));
2401
2402 return ret;
2403 }
2404
2405 static void
2406 update_code_flag (int value, int check)
2407 {
2408 PRINTF_LIKE ((*as_error));
2409
2410 flag_code = (enum flag_code) value;
2411 if (flag_code == CODE_64BIT)
2412 {
2413 cpu_arch_flags.bitfield.cpu64 = 1;
2414 cpu_arch_flags.bitfield.cpuno64 = 0;
2415 }
2416 else
2417 {
2418 cpu_arch_flags.bitfield.cpu64 = 0;
2419 cpu_arch_flags.bitfield.cpuno64 = 1;
2420 }
2421 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2422 {
2423 if (check)
2424 as_error = as_fatal;
2425 else
2426 as_error = as_bad;
2427 (*as_error) (_("64bit mode not supported on `%s'."),
2428 cpu_arch_name ? cpu_arch_name : default_arch);
2429 }
2430 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2431 {
2432 if (check)
2433 as_error = as_fatal;
2434 else
2435 as_error = as_bad;
2436 (*as_error) (_("32bit mode not supported on `%s'."),
2437 cpu_arch_name ? cpu_arch_name : default_arch);
2438 }
2439 stackop_size = '\0';
2440 }
2441
2442 static void
2443 set_code_flag (int value)
2444 {
2445 update_code_flag (value, 0);
2446 }
2447
2448 static void
2449 set_16bit_gcc_code_flag (int new_code_flag)
2450 {
2451 flag_code = (enum flag_code) new_code_flag;
2452 if (flag_code != CODE_16BIT)
2453 abort ();
2454 cpu_arch_flags.bitfield.cpu64 = 0;
2455 cpu_arch_flags.bitfield.cpuno64 = 1;
2456 stackop_size = LONG_MNEM_SUFFIX;
2457 }
2458
2459 static void
2460 set_intel_syntax (int syntax_flag)
2461 {
2462 /* Find out if register prefixing is specified. */
2463 int ask_naked_reg = 0;
2464
2465 SKIP_WHITESPACE ();
2466 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2467 {
2468 char *string;
2469 int e = get_symbol_name (&string);
2470
2471 if (strcmp (string, "prefix") == 0)
2472 ask_naked_reg = 1;
2473 else if (strcmp (string, "noprefix") == 0)
2474 ask_naked_reg = -1;
2475 else
2476 as_bad (_("bad argument to syntax directive."));
2477 (void) restore_line_pointer (e);
2478 }
2479 demand_empty_rest_of_line ();
2480
2481 intel_syntax = syntax_flag;
2482
2483 if (ask_naked_reg == 0)
2484 allow_naked_reg = (intel_syntax
2485 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2486 else
2487 allow_naked_reg = (ask_naked_reg < 0);
2488
2489 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2490
2491 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2492 identifier_chars['$'] = intel_syntax ? '$' : 0;
2493 register_prefix = allow_naked_reg ? "" : "%";
2494 }
2495
2496 static void
2497 set_intel_mnemonic (int mnemonic_flag)
2498 {
2499 intel_mnemonic = mnemonic_flag;
2500 }
2501
2502 static void
2503 set_allow_index_reg (int flag)
2504 {
2505 allow_index_reg = flag;
2506 }
2507
2508 static void
2509 set_check (int what)
2510 {
2511 enum check_kind *kind;
2512 const char *str;
2513
2514 if (what)
2515 {
2516 kind = &operand_check;
2517 str = "operand";
2518 }
2519 else
2520 {
2521 kind = &sse_check;
2522 str = "sse";
2523 }
2524
2525 SKIP_WHITESPACE ();
2526
2527 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2528 {
2529 char *string;
2530 int e = get_symbol_name (&string);
2531
2532 if (strcmp (string, "none") == 0)
2533 *kind = check_none;
2534 else if (strcmp (string, "warning") == 0)
2535 *kind = check_warning;
2536 else if (strcmp (string, "error") == 0)
2537 *kind = check_error;
2538 else
2539 as_bad (_("bad argument to %s_check directive."), str);
2540 (void) restore_line_pointer (e);
2541 }
2542 else
2543 as_bad (_("missing argument for %s_check directive"), str);
2544
2545 demand_empty_rest_of_line ();
2546 }
2547
2548 static void
2549 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2550 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2551 {
2552 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2553 static const char *arch;
2554
2555 /* Intel LIOM is only supported on ELF. */
2556 if (!IS_ELF)
2557 return;
2558
2559 if (!arch)
2560 {
2561 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2562 use default_arch. */
2563 arch = cpu_arch_name;
2564 if (!arch)
2565 arch = default_arch;
2566 }
2567
2568 /* If we are targeting Intel MCU, we must enable it. */
2569 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2570 || new_flag.bitfield.cpuiamcu)
2571 return;
2572
2573 /* If we are targeting Intel L1OM, we must enable it. */
2574 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2575 || new_flag.bitfield.cpul1om)
2576 return;
2577
2578 /* If we are targeting Intel K1OM, we must enable it. */
2579 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2580 || new_flag.bitfield.cpuk1om)
2581 return;
2582
2583 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2584 #endif
2585 }
2586
2587 static void
2588 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2589 {
2590 SKIP_WHITESPACE ();
2591
2592 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2593 {
2594 char *string;
2595 int e = get_symbol_name (&string);
2596 unsigned int j;
2597 i386_cpu_flags flags;
2598
2599 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2600 {
2601 if (strcmp (string, cpu_arch[j].name) == 0)
2602 {
2603 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2604
2605 if (*string != '.')
2606 {
2607 cpu_arch_name = cpu_arch[j].name;
2608 cpu_sub_arch_name = NULL;
2609 cpu_arch_flags = cpu_arch[j].flags;
2610 if (flag_code == CODE_64BIT)
2611 {
2612 cpu_arch_flags.bitfield.cpu64 = 1;
2613 cpu_arch_flags.bitfield.cpuno64 = 0;
2614 }
2615 else
2616 {
2617 cpu_arch_flags.bitfield.cpu64 = 0;
2618 cpu_arch_flags.bitfield.cpuno64 = 1;
2619 }
2620 cpu_arch_isa = cpu_arch[j].type;
2621 cpu_arch_isa_flags = cpu_arch[j].flags;
2622 if (!cpu_arch_tune_set)
2623 {
2624 cpu_arch_tune = cpu_arch_isa;
2625 cpu_arch_tune_flags = cpu_arch_isa_flags;
2626 }
2627 break;
2628 }
2629
2630 flags = cpu_flags_or (cpu_arch_flags,
2631 cpu_arch[j].flags);
2632
2633 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2634 {
2635 if (cpu_sub_arch_name)
2636 {
2637 char *name = cpu_sub_arch_name;
2638 cpu_sub_arch_name = concat (name,
2639 cpu_arch[j].name,
2640 (const char *) NULL);
2641 free (name);
2642 }
2643 else
2644 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2645 cpu_arch_flags = flags;
2646 cpu_arch_isa_flags = flags;
2647 }
2648 else
2649 cpu_arch_isa_flags
2650 = cpu_flags_or (cpu_arch_isa_flags,
2651 cpu_arch[j].flags);
2652 (void) restore_line_pointer (e);
2653 demand_empty_rest_of_line ();
2654 return;
2655 }
2656 }
2657
2658 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2659 {
2660 /* Disable an ISA extension. */
2661 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2662 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2663 {
2664 flags = cpu_flags_and_not (cpu_arch_flags,
2665 cpu_noarch[j].flags);
2666 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2667 {
2668 if (cpu_sub_arch_name)
2669 {
2670 char *name = cpu_sub_arch_name;
2671 cpu_sub_arch_name = concat (name, string,
2672 (const char *) NULL);
2673 free (name);
2674 }
2675 else
2676 cpu_sub_arch_name = xstrdup (string);
2677 cpu_arch_flags = flags;
2678 cpu_arch_isa_flags = flags;
2679 }
2680 (void) restore_line_pointer (e);
2681 demand_empty_rest_of_line ();
2682 return;
2683 }
2684
2685 j = ARRAY_SIZE (cpu_arch);
2686 }
2687
2688 if (j >= ARRAY_SIZE (cpu_arch))
2689 as_bad (_("no such architecture: `%s'"), string);
2690
2691 *input_line_pointer = e;
2692 }
2693 else
2694 as_bad (_("missing cpu architecture"));
2695
2696 no_cond_jump_promotion = 0;
2697 if (*input_line_pointer == ','
2698 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2699 {
2700 char *string;
2701 char e;
2702
2703 ++input_line_pointer;
2704 e = get_symbol_name (&string);
2705
2706 if (strcmp (string, "nojumps") == 0)
2707 no_cond_jump_promotion = 1;
2708 else if (strcmp (string, "jumps") == 0)
2709 ;
2710 else
2711 as_bad (_("no such architecture modifier: `%s'"), string);
2712
2713 (void) restore_line_pointer (e);
2714 }
2715
2716 demand_empty_rest_of_line ();
2717 }
2718
2719 enum bfd_architecture
2720 i386_arch (void)
2721 {
2722 if (cpu_arch_isa == PROCESSOR_L1OM)
2723 {
2724 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2725 || flag_code != CODE_64BIT)
2726 as_fatal (_("Intel L1OM is 64bit ELF only"));
2727 return bfd_arch_l1om;
2728 }
2729 else if (cpu_arch_isa == PROCESSOR_K1OM)
2730 {
2731 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2732 || flag_code != CODE_64BIT)
2733 as_fatal (_("Intel K1OM is 64bit ELF only"));
2734 return bfd_arch_k1om;
2735 }
2736 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2737 {
2738 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2739 || flag_code == CODE_64BIT)
2740 as_fatal (_("Intel MCU is 32bit ELF only"));
2741 return bfd_arch_iamcu;
2742 }
2743 else
2744 return bfd_arch_i386;
2745 }
2746
2747 unsigned long
2748 i386_mach (void)
2749 {
2750 if (!strncmp (default_arch, "x86_64", 6))
2751 {
2752 if (cpu_arch_isa == PROCESSOR_L1OM)
2753 {
2754 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2755 || default_arch[6] != '\0')
2756 as_fatal (_("Intel L1OM is 64bit ELF only"));
2757 return bfd_mach_l1om;
2758 }
2759 else if (cpu_arch_isa == PROCESSOR_K1OM)
2760 {
2761 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2762 || default_arch[6] != '\0')
2763 as_fatal (_("Intel K1OM is 64bit ELF only"));
2764 return bfd_mach_k1om;
2765 }
2766 else if (default_arch[6] == '\0')
2767 return bfd_mach_x86_64;
2768 else
2769 return bfd_mach_x64_32;
2770 }
2771 else if (!strcmp (default_arch, "i386")
2772 || !strcmp (default_arch, "iamcu"))
2773 {
2774 if (cpu_arch_isa == PROCESSOR_IAMCU)
2775 {
2776 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2777 as_fatal (_("Intel MCU is 32bit ELF only"));
2778 return bfd_mach_i386_iamcu;
2779 }
2780 else
2781 return bfd_mach_i386_i386;
2782 }
2783 else
2784 as_fatal (_("unknown architecture"));
2785 }
2786 \f
2787 void
2788 md_begin (void)
2789 {
2790 const char *hash_err;
2791
2792 /* Support pseudo prefixes like {disp32}. */
2793 lex_type ['{'] = LEX_BEGIN_NAME;
2794
2795 /* Initialize op_hash hash table. */
2796 op_hash = hash_new ();
2797
2798 {
2799 const insn_template *optab;
2800 templates *core_optab;
2801
2802 /* Setup for loop. */
2803 optab = i386_optab;
2804 core_optab = XNEW (templates);
2805 core_optab->start = optab;
2806
2807 while (1)
2808 {
2809 ++optab;
2810 if (optab->name == NULL
2811 || strcmp (optab->name, (optab - 1)->name) != 0)
2812 {
2813 /* different name --> ship out current template list;
2814 add to hash table; & begin anew. */
2815 core_optab->end = optab;
2816 hash_err = hash_insert (op_hash,
2817 (optab - 1)->name,
2818 (void *) core_optab);
2819 if (hash_err)
2820 {
2821 as_fatal (_("can't hash %s: %s"),
2822 (optab - 1)->name,
2823 hash_err);
2824 }
2825 if (optab->name == NULL)
2826 break;
2827 core_optab = XNEW (templates);
2828 core_optab->start = optab;
2829 }
2830 }
2831 }
2832
2833 /* Initialize reg_hash hash table. */
2834 reg_hash = hash_new ();
2835 {
2836 const reg_entry *regtab;
2837 unsigned int regtab_size = i386_regtab_size;
2838
2839 for (regtab = i386_regtab; regtab_size--; regtab++)
2840 {
2841 hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2842 if (hash_err)
2843 as_fatal (_("can't hash %s: %s"),
2844 regtab->reg_name,
2845 hash_err);
2846 }
2847 }
2848
2849 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
2850 {
2851 int c;
2852 char *p;
2853
2854 for (c = 0; c < 256; c++)
2855 {
2856 if (ISDIGIT (c))
2857 {
2858 digit_chars[c] = c;
2859 mnemonic_chars[c] = c;
2860 register_chars[c] = c;
2861 operand_chars[c] = c;
2862 }
2863 else if (ISLOWER (c))
2864 {
2865 mnemonic_chars[c] = c;
2866 register_chars[c] = c;
2867 operand_chars[c] = c;
2868 }
2869 else if (ISUPPER (c))
2870 {
2871 mnemonic_chars[c] = TOLOWER (c);
2872 register_chars[c] = mnemonic_chars[c];
2873 operand_chars[c] = c;
2874 }
2875 else if (c == '{' || c == '}')
2876 {
2877 mnemonic_chars[c] = c;
2878 operand_chars[c] = c;
2879 }
2880
2881 if (ISALPHA (c) || ISDIGIT (c))
2882 identifier_chars[c] = c;
2883 else if (c >= 128)
2884 {
2885 identifier_chars[c] = c;
2886 operand_chars[c] = c;
2887 }
2888 }
2889
2890 #ifdef LEX_AT
2891 identifier_chars['@'] = '@';
2892 #endif
2893 #ifdef LEX_QM
2894 identifier_chars['?'] = '?';
2895 operand_chars['?'] = '?';
2896 #endif
2897 digit_chars['-'] = '-';
2898 mnemonic_chars['_'] = '_';
2899 mnemonic_chars['-'] = '-';
2900 mnemonic_chars['.'] = '.';
2901 identifier_chars['_'] = '_';
2902 identifier_chars['.'] = '.';
2903
2904 for (p = operand_special_chars; *p != '\0'; p++)
2905 operand_chars[(unsigned char) *p] = *p;
2906 }
2907
2908 if (flag_code == CODE_64BIT)
2909 {
2910 #if defined (OBJ_COFF) && defined (TE_PE)
2911 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2912 ? 32 : 16);
2913 #else
2914 x86_dwarf2_return_column = 16;
2915 #endif
2916 x86_cie_data_alignment = -8;
2917 }
2918 else
2919 {
2920 x86_dwarf2_return_column = 8;
2921 x86_cie_data_alignment = -4;
2922 }
2923 }
2924
2925 void
2926 i386_print_statistics (FILE *file)
2927 {
2928 hash_print_statistics (file, "i386 opcode", op_hash);
2929 hash_print_statistics (file, "i386 register", reg_hash);
2930 }
2931 \f
2932 #ifdef DEBUG386
2933
2934 /* Debugging routines for md_assemble. */
2935 static void pte (insn_template *);
2936 static void pt (i386_operand_type);
2937 static void pe (expressionS *);
2938 static void ps (symbolS *);
2939
2940 static void
2941 pi (char *line, i386_insn *x)
2942 {
2943 unsigned int j;
2944
2945 fprintf (stdout, "%s: template ", line);
2946 pte (&x->tm);
2947 fprintf (stdout, " address: base %s index %s scale %x\n",
2948 x->base_reg ? x->base_reg->reg_name : "none",
2949 x->index_reg ? x->index_reg->reg_name : "none",
2950 x->log2_scale_factor);
2951 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
2952 x->rm.mode, x->rm.reg, x->rm.regmem);
2953 fprintf (stdout, " sib: base %x index %x scale %x\n",
2954 x->sib.base, x->sib.index, x->sib.scale);
2955 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
2956 (x->rex & REX_W) != 0,
2957 (x->rex & REX_R) != 0,
2958 (x->rex & REX_X) != 0,
2959 (x->rex & REX_B) != 0);
2960 for (j = 0; j < x->operands; j++)
2961 {
2962 fprintf (stdout, " #%d: ", j + 1);
2963 pt (x->types[j]);
2964 fprintf (stdout, "\n");
2965 if (x->types[j].bitfield.reg
2966 || x->types[j].bitfield.regmmx
2967 || x->types[j].bitfield.regsimd
2968 || x->types[j].bitfield.sreg2
2969 || x->types[j].bitfield.sreg3
2970 || x->types[j].bitfield.control
2971 || x->types[j].bitfield.debug
2972 || x->types[j].bitfield.test)
2973 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
2974 if (operand_type_check (x->types[j], imm))
2975 pe (x->op[j].imms);
2976 if (operand_type_check (x->types[j], disp))
2977 pe (x->op[j].disps);
2978 }
2979 }
2980
2981 static void
2982 pte (insn_template *t)
2983 {
2984 unsigned int j;
2985 fprintf (stdout, " %d operands ", t->operands);
2986 fprintf (stdout, "opcode %x ", t->base_opcode);
2987 if (t->extension_opcode != None)
2988 fprintf (stdout, "ext %x ", t->extension_opcode);
2989 if (t->opcode_modifier.d)
2990 fprintf (stdout, "D");
2991 if (t->opcode_modifier.w)
2992 fprintf (stdout, "W");
2993 fprintf (stdout, "\n");
2994 for (j = 0; j < t->operands; j++)
2995 {
2996 fprintf (stdout, " #%d type ", j + 1);
2997 pt (t->operand_types[j]);
2998 fprintf (stdout, "\n");
2999 }
3000 }
3001
3002 static void
3003 pe (expressionS *e)
3004 {
3005 fprintf (stdout, " operation %d\n", e->X_op);
3006 fprintf (stdout, " add_number %ld (%lx)\n",
3007 (long) e->X_add_number, (long) e->X_add_number);
3008 if (e->X_add_symbol)
3009 {
3010 fprintf (stdout, " add_symbol ");
3011 ps (e->X_add_symbol);
3012 fprintf (stdout, "\n");
3013 }
3014 if (e->X_op_symbol)
3015 {
3016 fprintf (stdout, " op_symbol ");
3017 ps (e->X_op_symbol);
3018 fprintf (stdout, "\n");
3019 }
3020 }
3021
3022 static void
3023 ps (symbolS *s)
3024 {
3025 fprintf (stdout, "%s type %s%s",
3026 S_GET_NAME (s),
3027 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3028 segment_name (S_GET_SEGMENT (s)));
3029 }
3030
3031 static struct type_name
3032 {
3033 i386_operand_type mask;
3034 const char *name;
3035 }
3036 const type_names[] =
3037 {
3038 { OPERAND_TYPE_REG8, "r8" },
3039 { OPERAND_TYPE_REG16, "r16" },
3040 { OPERAND_TYPE_REG32, "r32" },
3041 { OPERAND_TYPE_REG64, "r64" },
3042 { OPERAND_TYPE_IMM8, "i8" },
3043 { OPERAND_TYPE_IMM8, "i8s" },
3044 { OPERAND_TYPE_IMM16, "i16" },
3045 { OPERAND_TYPE_IMM32, "i32" },
3046 { OPERAND_TYPE_IMM32S, "i32s" },
3047 { OPERAND_TYPE_IMM64, "i64" },
3048 { OPERAND_TYPE_IMM1, "i1" },
3049 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3050 { OPERAND_TYPE_DISP8, "d8" },
3051 { OPERAND_TYPE_DISP16, "d16" },
3052 { OPERAND_TYPE_DISP32, "d32" },
3053 { OPERAND_TYPE_DISP32S, "d32s" },
3054 { OPERAND_TYPE_DISP64, "d64" },
3055 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3056 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3057 { OPERAND_TYPE_CONTROL, "control reg" },
3058 { OPERAND_TYPE_TEST, "test reg" },
3059 { OPERAND_TYPE_DEBUG, "debug reg" },
3060 { OPERAND_TYPE_FLOATREG, "FReg" },
3061 { OPERAND_TYPE_FLOATACC, "FAcc" },
3062 { OPERAND_TYPE_SREG2, "SReg2" },
3063 { OPERAND_TYPE_SREG3, "SReg3" },
3064 { OPERAND_TYPE_ACC, "Acc" },
3065 { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
3066 { OPERAND_TYPE_REGMMX, "rMMX" },
3067 { OPERAND_TYPE_REGXMM, "rXMM" },
3068 { OPERAND_TYPE_REGYMM, "rYMM" },
3069 { OPERAND_TYPE_REGZMM, "rZMM" },
3070 { OPERAND_TYPE_REGMASK, "Mask reg" },
3071 { OPERAND_TYPE_ESSEG, "es" },
3072 };
3073
3074 static void
3075 pt (i386_operand_type t)
3076 {
3077 unsigned int j;
3078 i386_operand_type a;
3079
3080 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3081 {
3082 a = operand_type_and (t, type_names[j].mask);
3083 if (!operand_type_all_zero (&a))
3084 fprintf (stdout, "%s, ", type_names[j].name);
3085 }
3086 fflush (stdout);
3087 }
3088
3089 #endif /* DEBUG386 */
3090 \f
3091 static bfd_reloc_code_real_type
3092 reloc (unsigned int size,
3093 int pcrel,
3094 int sign,
3095 bfd_reloc_code_real_type other)
3096 {
3097 if (other != NO_RELOC)
3098 {
3099 reloc_howto_type *rel;
3100
3101 if (size == 8)
3102 switch (other)
3103 {
3104 case BFD_RELOC_X86_64_GOT32:
3105 return BFD_RELOC_X86_64_GOT64;
3106 break;
3107 case BFD_RELOC_X86_64_GOTPLT64:
3108 return BFD_RELOC_X86_64_GOTPLT64;
3109 break;
3110 case BFD_RELOC_X86_64_PLTOFF64:
3111 return BFD_RELOC_X86_64_PLTOFF64;
3112 break;
3113 case BFD_RELOC_X86_64_GOTPC32:
3114 other = BFD_RELOC_X86_64_GOTPC64;
3115 break;
3116 case BFD_RELOC_X86_64_GOTPCREL:
3117 other = BFD_RELOC_X86_64_GOTPCREL64;
3118 break;
3119 case BFD_RELOC_X86_64_TPOFF32:
3120 other = BFD_RELOC_X86_64_TPOFF64;
3121 break;
3122 case BFD_RELOC_X86_64_DTPOFF32:
3123 other = BFD_RELOC_X86_64_DTPOFF64;
3124 break;
3125 default:
3126 break;
3127 }
3128
3129 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3130 if (other == BFD_RELOC_SIZE32)
3131 {
3132 if (size == 8)
3133 other = BFD_RELOC_SIZE64;
3134 if (pcrel)
3135 {
3136 as_bad (_("there are no pc-relative size relocations"));
3137 return NO_RELOC;
3138 }
3139 }
3140 #endif
3141
3142 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3143 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3144 sign = -1;
3145
3146 rel = bfd_reloc_type_lookup (stdoutput, other);
3147 if (!rel)
3148 as_bad (_("unknown relocation (%u)"), other);
3149 else if (size != bfd_get_reloc_size (rel))
3150 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3151 bfd_get_reloc_size (rel),
3152 size);
3153 else if (pcrel && !rel->pc_relative)
3154 as_bad (_("non-pc-relative relocation for pc-relative field"));
3155 else if ((rel->complain_on_overflow == complain_overflow_signed
3156 && !sign)
3157 || (rel->complain_on_overflow == complain_overflow_unsigned
3158 && sign > 0))
3159 as_bad (_("relocated field and relocation type differ in signedness"));
3160 else
3161 return other;
3162 return NO_RELOC;
3163 }
3164
3165 if (pcrel)
3166 {
3167 if (!sign)
3168 as_bad (_("there are no unsigned pc-relative relocations"));
3169 switch (size)
3170 {
3171 case 1: return BFD_RELOC_8_PCREL;
3172 case 2: return BFD_RELOC_16_PCREL;
3173 case 4: return BFD_RELOC_32_PCREL;
3174 case 8: return BFD_RELOC_64_PCREL;
3175 }
3176 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3177 }
3178 else
3179 {
3180 if (sign > 0)
3181 switch (size)
3182 {
3183 case 4: return BFD_RELOC_X86_64_32S;
3184 }
3185 else
3186 switch (size)
3187 {
3188 case 1: return BFD_RELOC_8;
3189 case 2: return BFD_RELOC_16;
3190 case 4: return BFD_RELOC_32;
3191 case 8: return BFD_RELOC_64;
3192 }
3193 as_bad (_("cannot do %s %u byte relocation"),
3194 sign > 0 ? "signed" : "unsigned", size);
3195 }
3196
3197 return NO_RELOC;
3198 }
3199
3200 /* Here we decide which fixups can be adjusted to make them relative to
3201 the beginning of the section instead of the symbol. Basically we need
3202 to make sure that the dynamic relocations are done correctly, so in
3203 some cases we force the original symbol to be used. */
3204
3205 int
3206 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3207 {
3208 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3209 if (!IS_ELF)
3210 return 1;
3211
3212 /* Don't adjust pc-relative references to merge sections in 64-bit
3213 mode. */
3214 if (use_rela_relocations
3215 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3216 && fixP->fx_pcrel)
3217 return 0;
3218
3219 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3220 and changed later by validate_fix. */
3221 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3222 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3223 return 0;
3224
3225 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3226 for size relocations. */
3227 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3228 || fixP->fx_r_type == BFD_RELOC_SIZE64
3229 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3230 || fixP->fx_r_type == BFD_RELOC_386_PLT32
3231 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3232 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3233 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3234 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3235 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3236 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3237 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3238 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3239 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3240 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3241 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3242 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3243 || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
3244 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3245 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3246 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3247 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3248 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3249 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3250 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3251 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3252 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3253 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3254 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3255 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3256 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3257 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3258 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3259 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3260 return 0;
3261 #endif
3262 return 1;
3263 }
3264
3265 static int
3266 intel_float_operand (const char *mnemonic)
3267 {
3268 /* Note that the value returned is meaningful only for opcodes with (memory)
3269 operands, hence the code here is free to improperly handle opcodes that
3270 have no operands (for better performance and smaller code). */
3271
3272 if (mnemonic[0] != 'f')
3273 return 0; /* non-math */
3274
3275 switch (mnemonic[1])
3276 {
3277 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3278 the fs segment override prefix not currently handled because no
3279 call path can make opcodes without operands get here */
3280 case 'i':
3281 return 2 /* integer op */;
3282 case 'l':
3283 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3284 return 3; /* fldcw/fldenv */
3285 break;
3286 case 'n':
3287 if (mnemonic[2] != 'o' /* fnop */)
3288 return 3; /* non-waiting control op */
3289 break;
3290 case 'r':
3291 if (mnemonic[2] == 's')
3292 return 3; /* frstor/frstpm */
3293 break;
3294 case 's':
3295 if (mnemonic[2] == 'a')
3296 return 3; /* fsave */
3297 if (mnemonic[2] == 't')
3298 {
3299 switch (mnemonic[3])
3300 {
3301 case 'c': /* fstcw */
3302 case 'd': /* fstdw */
3303 case 'e': /* fstenv */
3304 case 's': /* fsts[gw] */
3305 return 3;
3306 }
3307 }
3308 break;
3309 case 'x':
3310 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3311 return 0; /* fxsave/fxrstor are not really math ops */
3312 break;
3313 }
3314
3315 return 1;
3316 }
3317
3318 /* Build the VEX prefix. */
3319
3320 static void
3321 build_vex_prefix (const insn_template *t)
3322 {
3323 unsigned int register_specifier;
3324 unsigned int implied_prefix;
3325 unsigned int vector_length;
3326
3327 /* Check register specifier. */
3328 if (i.vex.register_specifier)
3329 {
3330 register_specifier =
3331 ~register_number (i.vex.register_specifier) & 0xf;
3332 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3333 }
3334 else
3335 register_specifier = 0xf;
3336
3337 /* Use 2-byte VEX prefix by swapping destination and source
3338 operand. */
3339 if (i.vec_encoding != vex_encoding_vex3
3340 && i.dir_encoding == dir_encoding_default
3341 && i.operands == i.reg_operands
3342 && i.tm.opcode_modifier.vexopcode == VEX0F
3343 && i.tm.opcode_modifier.load
3344 && i.rex == REX_B)
3345 {
3346 unsigned int xchg = i.operands - 1;
3347 union i386_op temp_op;
3348 i386_operand_type temp_type;
3349
3350 temp_type = i.types[xchg];
3351 i.types[xchg] = i.types[0];
3352 i.types[0] = temp_type;
3353 temp_op = i.op[xchg];
3354 i.op[xchg] = i.op[0];
3355 i.op[0] = temp_op;
3356
3357 gas_assert (i.rm.mode == 3);
3358
3359 i.rex = REX_R;
3360 xchg = i.rm.regmem;
3361 i.rm.regmem = i.rm.reg;
3362 i.rm.reg = xchg;
3363
3364 /* Use the next insn. */
3365 i.tm = t[1];
3366 }
3367
3368 if (i.tm.opcode_modifier.vex == VEXScalar)
3369 vector_length = avxscalar;
3370 else if (i.tm.opcode_modifier.vex == VEX256)
3371 vector_length = 1;
3372 else
3373 {
3374 unsigned int op;
3375
3376 /* Determine vector length from the last multi-length vector
3377 operand. */
3378 vector_length = 0;
3379 for (op = t->operands; op--;)
3380 if (t->operand_types[op].bitfield.xmmword
3381 && t->operand_types[op].bitfield.ymmword
3382 && i.types[op].bitfield.ymmword)
3383 {
3384 vector_length = 1;
3385 break;
3386 }
3387 }
3388
3389 switch ((i.tm.base_opcode >> 8) & 0xff)
3390 {
3391 case 0:
3392 implied_prefix = 0;
3393 break;
3394 case DATA_PREFIX_OPCODE:
3395 implied_prefix = 1;
3396 break;
3397 case REPE_PREFIX_OPCODE:
3398 implied_prefix = 2;
3399 break;
3400 case REPNE_PREFIX_OPCODE:
3401 implied_prefix = 3;
3402 break;
3403 default:
3404 abort ();
3405 }
3406
3407 /* Use 2-byte VEX prefix if possible. */
3408 if (i.vec_encoding != vex_encoding_vex3
3409 && i.tm.opcode_modifier.vexopcode == VEX0F
3410 && i.tm.opcode_modifier.vexw != VEXW1
3411 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3412 {
3413 /* 2-byte VEX prefix. */
3414 unsigned int r;
3415
3416 i.vex.length = 2;
3417 i.vex.bytes[0] = 0xc5;
3418
3419 /* Check the REX.R bit. */
3420 r = (i.rex & REX_R) ? 0 : 1;
3421 i.vex.bytes[1] = (r << 7
3422 | register_specifier << 3
3423 | vector_length << 2
3424 | implied_prefix);
3425 }
3426 else
3427 {
3428 /* 3-byte VEX prefix. */
3429 unsigned int m, w;
3430
3431 i.vex.length = 3;
3432
3433 switch (i.tm.opcode_modifier.vexopcode)
3434 {
3435 case VEX0F:
3436 m = 0x1;
3437 i.vex.bytes[0] = 0xc4;
3438 break;
3439 case VEX0F38:
3440 m = 0x2;
3441 i.vex.bytes[0] = 0xc4;
3442 break;
3443 case VEX0F3A:
3444 m = 0x3;
3445 i.vex.bytes[0] = 0xc4;
3446 break;
3447 case XOP08:
3448 m = 0x8;
3449 i.vex.bytes[0] = 0x8f;
3450 break;
3451 case XOP09:
3452 m = 0x9;
3453 i.vex.bytes[0] = 0x8f;
3454 break;
3455 case XOP0A:
3456 m = 0xa;
3457 i.vex.bytes[0] = 0x8f;
3458 break;
3459 default:
3460 abort ();
3461 }
3462
3463 /* The high 3 bits of the second VEX byte are 1's compliment
3464 of RXB bits from REX. */
3465 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3466
3467 /* Check the REX.W bit. */
3468 w = (i.rex & REX_W) ? 1 : 0;
3469 if (i.tm.opcode_modifier.vexw == VEXW1)
3470 w = 1;
3471
3472 i.vex.bytes[2] = (w << 7
3473 | register_specifier << 3
3474 | vector_length << 2
3475 | implied_prefix);
3476 }
3477 }
3478
3479 static INLINE bfd_boolean
3480 is_evex_encoding (const insn_template *t)
3481 {
3482 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3483 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3484 || t->opcode_modifier.staticrounding || t->opcode_modifier.sae;
3485 }
3486
3487 static INLINE bfd_boolean
3488 is_any_vex_encoding (const insn_template *t)
3489 {
3490 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3491 || is_evex_encoding (t);
3492 }
3493
3494 /* Build the EVEX prefix. */
3495
3496 static void
3497 build_evex_prefix (void)
3498 {
3499 unsigned int register_specifier;
3500 unsigned int implied_prefix;
3501 unsigned int m, w;
3502 rex_byte vrex_used = 0;
3503
3504 /* Check register specifier. */
3505 if (i.vex.register_specifier)
3506 {
3507 gas_assert ((i.vrex & REX_X) == 0);
3508
3509 register_specifier = i.vex.register_specifier->reg_num;
3510 if ((i.vex.register_specifier->reg_flags & RegRex))
3511 register_specifier += 8;
3512 /* The upper 16 registers are encoded in the fourth byte of the
3513 EVEX prefix. */
3514 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3515 i.vex.bytes[3] = 0x8;
3516 register_specifier = ~register_specifier & 0xf;
3517 }
3518 else
3519 {
3520 register_specifier = 0xf;
3521
3522 /* Encode upper 16 vector index register in the fourth byte of
3523 the EVEX prefix. */
3524 if (!(i.vrex & REX_X))
3525 i.vex.bytes[3] = 0x8;
3526 else
3527 vrex_used |= REX_X;
3528 }
3529
3530 switch ((i.tm.base_opcode >> 8) & 0xff)
3531 {
3532 case 0:
3533 implied_prefix = 0;
3534 break;
3535 case DATA_PREFIX_OPCODE:
3536 implied_prefix = 1;
3537 break;
3538 case REPE_PREFIX_OPCODE:
3539 implied_prefix = 2;
3540 break;
3541 case REPNE_PREFIX_OPCODE:
3542 implied_prefix = 3;
3543 break;
3544 default:
3545 abort ();
3546 }
3547
3548 /* 4 byte EVEX prefix. */
3549 i.vex.length = 4;
3550 i.vex.bytes[0] = 0x62;
3551
3552 /* mmmm bits. */
3553 switch (i.tm.opcode_modifier.vexopcode)
3554 {
3555 case VEX0F:
3556 m = 1;
3557 break;
3558 case VEX0F38:
3559 m = 2;
3560 break;
3561 case VEX0F3A:
3562 m = 3;
3563 break;
3564 default:
3565 abort ();
3566 break;
3567 }
3568
3569 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3570 bits from REX. */
3571 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3572
3573 /* The fifth bit of the second EVEX byte is 1's compliment of the
3574 REX_R bit in VREX. */
3575 if (!(i.vrex & REX_R))
3576 i.vex.bytes[1] |= 0x10;
3577 else
3578 vrex_used |= REX_R;
3579
3580 if ((i.reg_operands + i.imm_operands) == i.operands)
3581 {
3582 /* When all operands are registers, the REX_X bit in REX is not
3583 used. We reuse it to encode the upper 16 registers, which is
3584 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3585 as 1's compliment. */
3586 if ((i.vrex & REX_B))
3587 {
3588 vrex_used |= REX_B;
3589 i.vex.bytes[1] &= ~0x40;
3590 }
3591 }
3592
3593 /* EVEX instructions shouldn't need the REX prefix. */
3594 i.vrex &= ~vrex_used;
3595 gas_assert (i.vrex == 0);
3596
3597 /* Check the REX.W bit. */
3598 w = (i.rex & REX_W) ? 1 : 0;
3599 if (i.tm.opcode_modifier.vexw)
3600 {
3601 if (i.tm.opcode_modifier.vexw == VEXW1)
3602 w = 1;
3603 }
3604 /* If w is not set it means we are dealing with WIG instruction. */
3605 else if (!w)
3606 {
3607 if (evexwig == evexw1)
3608 w = 1;
3609 }
3610
3611 /* Encode the U bit. */
3612 implied_prefix |= 0x4;
3613
3614 /* The third byte of the EVEX prefix. */
3615 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3616
3617 /* The fourth byte of the EVEX prefix. */
3618 /* The zeroing-masking bit. */
3619 if (i.mask && i.mask->zeroing)
3620 i.vex.bytes[3] |= 0x80;
3621
3622 /* Don't always set the broadcast bit if there is no RC. */
3623 if (!i.rounding)
3624 {
3625 /* Encode the vector length. */
3626 unsigned int vec_length;
3627
3628 if (!i.tm.opcode_modifier.evex
3629 || i.tm.opcode_modifier.evex == EVEXDYN)
3630 {
3631 unsigned int op;
3632
3633 /* Determine vector length from the last multi-length vector
3634 operand. */
3635 vec_length = 0;
3636 for (op = i.operands; op--;)
3637 if (i.tm.operand_types[op].bitfield.xmmword
3638 + i.tm.operand_types[op].bitfield.ymmword
3639 + i.tm.operand_types[op].bitfield.zmmword > 1)
3640 {
3641 if (i.types[op].bitfield.zmmword)
3642 {
3643 i.tm.opcode_modifier.evex = EVEX512;
3644 break;
3645 }
3646 else if (i.types[op].bitfield.ymmword)
3647 {
3648 i.tm.opcode_modifier.evex = EVEX256;
3649 break;
3650 }
3651 else if (i.types[op].bitfield.xmmword)
3652 {
3653 i.tm.opcode_modifier.evex = EVEX128;
3654 break;
3655 }
3656 else if (i.broadcast && (int) op == i.broadcast->operand)
3657 {
3658 switch (i.broadcast->bytes)
3659 {
3660 case 64:
3661 i.tm.opcode_modifier.evex = EVEX512;
3662 break;
3663 case 32:
3664 i.tm.opcode_modifier.evex = EVEX256;
3665 break;
3666 case 16:
3667 i.tm.opcode_modifier.evex = EVEX128;
3668 break;
3669 default:
3670 abort ();
3671 }
3672 break;
3673 }
3674 }
3675
3676 if (op >= MAX_OPERANDS)
3677 abort ();
3678 }
3679
3680 switch (i.tm.opcode_modifier.evex)
3681 {
3682 case EVEXLIG: /* LL' is ignored */
3683 vec_length = evexlig << 5;
3684 break;
3685 case EVEX128:
3686 vec_length = 0 << 5;
3687 break;
3688 case EVEX256:
3689 vec_length = 1 << 5;
3690 break;
3691 case EVEX512:
3692 vec_length = 2 << 5;
3693 break;
3694 default:
3695 abort ();
3696 break;
3697 }
3698 i.vex.bytes[3] |= vec_length;
3699 /* Encode the broadcast bit. */
3700 if (i.broadcast)
3701 i.vex.bytes[3] |= 0x10;
3702 }
3703 else
3704 {
3705 if (i.rounding->type != saeonly)
3706 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3707 else
3708 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3709 }
3710
3711 if (i.mask && i.mask->mask)
3712 i.vex.bytes[3] |= i.mask->mask->reg_num;
3713 }
3714
3715 static void
3716 process_immext (void)
3717 {
3718 expressionS *exp;
3719
3720 if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3721 && i.operands > 0)
3722 {
3723 /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3724 with an opcode suffix which is coded in the same place as an
3725 8-bit immediate field would be.
3726 Here we check those operands and remove them afterwards. */
3727 unsigned int x;
3728
3729 for (x = 0; x < i.operands; x++)
3730 if (register_number (i.op[x].regs) != x)
3731 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3732 register_prefix, i.op[x].regs->reg_name, x + 1,
3733 i.tm.name);
3734
3735 i.operands = 0;
3736 }
3737
3738 if (i.tm.cpu_flags.bitfield.cpumwaitx && i.operands > 0)
3739 {
3740 /* MONITORX/MWAITX instructions have fixed operands with an opcode
3741 suffix which is coded in the same place as an 8-bit immediate
3742 field would be.
3743 Here we check those operands and remove them afterwards. */
3744 unsigned int x;
3745
3746 if (i.operands != 3)
3747 abort();
3748
3749 for (x = 0; x < 2; x++)
3750 if (register_number (i.op[x].regs) != x)
3751 goto bad_register_operand;
3752
3753 /* Check for third operand for mwaitx/monitorx insn. */
3754 if (register_number (i.op[x].regs)
3755 != (x + (i.tm.extension_opcode == 0xfb)))
3756 {
3757 bad_register_operand:
3758 as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3759 register_prefix, i.op[x].regs->reg_name, x+1,
3760 i.tm.name);
3761 }
3762
3763 i.operands = 0;
3764 }
3765
3766 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3767 which is coded in the same place as an 8-bit immediate field
3768 would be. Here we fake an 8-bit immediate operand from the
3769 opcode suffix stored in tm.extension_opcode.
3770
3771 AVX instructions also use this encoding, for some of
3772 3 argument instructions. */
3773
3774 gas_assert (i.imm_operands <= 1
3775 && (i.operands <= 2
3776 || (is_any_vex_encoding (&i.tm)
3777 && i.operands <= 4)));
3778
3779 exp = &im_expressions[i.imm_operands++];
3780 i.op[i.operands].imms = exp;
3781 i.types[i.operands] = imm8;
3782 i.operands++;
3783 exp->X_op = O_constant;
3784 exp->X_add_number = i.tm.extension_opcode;
3785 i.tm.extension_opcode = None;
3786 }
3787
3788
3789 static int
3790 check_hle (void)
3791 {
3792 switch (i.tm.opcode_modifier.hleprefixok)
3793 {
3794 default:
3795 abort ();
3796 case HLEPrefixNone:
3797 as_bad (_("invalid instruction `%s' after `%s'"),
3798 i.tm.name, i.hle_prefix);
3799 return 0;
3800 case HLEPrefixLock:
3801 if (i.prefix[LOCK_PREFIX])
3802 return 1;
3803 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3804 return 0;
3805 case HLEPrefixAny:
3806 return 1;
3807 case HLEPrefixRelease:
3808 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3809 {
3810 as_bad (_("instruction `%s' after `xacquire' not allowed"),
3811 i.tm.name);
3812 return 0;
3813 }
3814 if (i.mem_operands == 0
3815 || !operand_type_check (i.types[i.operands - 1], anymem))
3816 {
3817 as_bad (_("memory destination needed for instruction `%s'"
3818 " after `xrelease'"), i.tm.name);
3819 return 0;
3820 }
3821 return 1;
3822 }
3823 }
3824
3825 /* Try the shortest encoding by shortening operand size. */
3826
3827 static void
3828 optimize_encoding (void)
3829 {
3830 int j;
3831
3832 if (optimize_for_space
3833 && i.reg_operands == 1
3834 && i.imm_operands == 1
3835 && !i.types[1].bitfield.byte
3836 && i.op[0].imms->X_op == O_constant
3837 && fits_in_imm7 (i.op[0].imms->X_add_number)
3838 && ((i.tm.base_opcode == 0xa8
3839 && i.tm.extension_opcode == None)
3840 || (i.tm.base_opcode == 0xf6
3841 && i.tm.extension_opcode == 0x0)))
3842 {
3843 /* Optimize: -Os:
3844 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
3845 */
3846 unsigned int base_regnum = i.op[1].regs->reg_num;
3847 if (flag_code == CODE_64BIT || base_regnum < 4)
3848 {
3849 i.types[1].bitfield.byte = 1;
3850 /* Ignore the suffix. */
3851 i.suffix = 0;
3852 if (base_regnum >= 4
3853 && !(i.op[1].regs->reg_flags & RegRex))
3854 {
3855 /* Handle SP, BP, SI and DI registers. */
3856 if (i.types[1].bitfield.word)
3857 j = 16;
3858 else if (i.types[1].bitfield.dword)
3859 j = 32;
3860 else
3861 j = 48;
3862 i.op[1].regs -= j;
3863 }
3864 }
3865 }
3866 else if (flag_code == CODE_64BIT
3867 && ((i.types[1].bitfield.qword
3868 && i.reg_operands == 1
3869 && i.imm_operands == 1
3870 && i.op[0].imms->X_op == O_constant
3871 && ((i.tm.base_opcode == 0xb0
3872 && i.tm.extension_opcode == None
3873 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
3874 || (fits_in_imm31 (i.op[0].imms->X_add_number)
3875 && (((i.tm.base_opcode == 0x24
3876 || i.tm.base_opcode == 0xa8)
3877 && i.tm.extension_opcode == None)
3878 || (i.tm.base_opcode == 0x80
3879 && i.tm.extension_opcode == 0x4)
3880 || ((i.tm.base_opcode == 0xf6
3881 || i.tm.base_opcode == 0xc6)
3882 && i.tm.extension_opcode == 0x0)))))
3883 || (i.types[0].bitfield.qword
3884 && ((i.reg_operands == 2
3885 && i.op[0].regs == i.op[1].regs
3886 && ((i.tm.base_opcode == 0x30
3887 || i.tm.base_opcode == 0x28)
3888 && i.tm.extension_opcode == None))
3889 || (i.reg_operands == 1
3890 && i.operands == 1
3891 && i.tm.base_opcode == 0x30
3892 && i.tm.extension_opcode == None)))))
3893 {
3894 /* Optimize: -O:
3895 andq $imm31, %r64 -> andl $imm31, %r32
3896 testq $imm31, %r64 -> testl $imm31, %r32
3897 xorq %r64, %r64 -> xorl %r32, %r32
3898 subq %r64, %r64 -> subl %r32, %r32
3899 movq $imm31, %r64 -> movl $imm31, %r32
3900 movq $imm32, %r64 -> movl $imm32, %r32
3901 */
3902 i.tm.opcode_modifier.norex64 = 1;
3903 if (i.tm.base_opcode == 0xb0 || i.tm.base_opcode == 0xc6)
3904 {
3905 /* Handle
3906 movq $imm31, %r64 -> movl $imm31, %r32
3907 movq $imm32, %r64 -> movl $imm32, %r32
3908 */
3909 i.tm.operand_types[0].bitfield.imm32 = 1;
3910 i.tm.operand_types[0].bitfield.imm32s = 0;
3911 i.tm.operand_types[0].bitfield.imm64 = 0;
3912 i.types[0].bitfield.imm32 = 1;
3913 i.types[0].bitfield.imm32s = 0;
3914 i.types[0].bitfield.imm64 = 0;
3915 i.types[1].bitfield.dword = 1;
3916 i.types[1].bitfield.qword = 0;
3917 if (i.tm.base_opcode == 0xc6)
3918 {
3919 /* Handle
3920 movq $imm31, %r64 -> movl $imm31, %r32
3921 */
3922 i.tm.base_opcode = 0xb0;
3923 i.tm.extension_opcode = None;
3924 i.tm.opcode_modifier.shortform = 1;
3925 i.tm.opcode_modifier.modrm = 0;
3926 }
3927 }
3928 }
3929 else if (optimize > 1
3930 && i.reg_operands == 3
3931 && i.op[0].regs == i.op[1].regs
3932 && !i.types[2].bitfield.xmmword
3933 && (i.tm.opcode_modifier.vex
3934 || ((!i.mask || i.mask->zeroing)
3935 && !i.rounding
3936 && is_evex_encoding (&i.tm)
3937 && (i.vec_encoding != vex_encoding_evex
3938 || i.tm.cpu_flags.bitfield.cpuavx512vl
3939 || (i.tm.operand_types[2].bitfield.zmmword
3940 && i.types[2].bitfield.ymmword)
3941 || cpu_arch_isa_flags.bitfield.cpuavx512vl)))
3942 && ((i.tm.base_opcode == 0x55
3943 || i.tm.base_opcode == 0x6655
3944 || i.tm.base_opcode == 0x66df
3945 || i.tm.base_opcode == 0x57
3946 || i.tm.base_opcode == 0x6657
3947 || i.tm.base_opcode == 0x66ef
3948 || i.tm.base_opcode == 0x66f8
3949 || i.tm.base_opcode == 0x66f9
3950 || i.tm.base_opcode == 0x66fa
3951 || i.tm.base_opcode == 0x66fb
3952 || i.tm.base_opcode == 0x42
3953 || i.tm.base_opcode == 0x6642
3954 || i.tm.base_opcode == 0x47
3955 || i.tm.base_opcode == 0x6647)
3956 && i.tm.extension_opcode == None))
3957 {
3958 /* Optimize: -O2:
3959 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
3960 vpsubq and vpsubw:
3961 EVEX VOP %zmmM, %zmmM, %zmmN
3962 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
3963 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3964 EVEX VOP %ymmM, %ymmM, %ymmN
3965 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
3966 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3967 VEX VOP %ymmM, %ymmM, %ymmN
3968 -> VEX VOP %xmmM, %xmmM, %xmmN
3969 VOP, one of vpandn and vpxor:
3970 VEX VOP %ymmM, %ymmM, %ymmN
3971 -> VEX VOP %xmmM, %xmmM, %xmmN
3972 VOP, one of vpandnd and vpandnq:
3973 EVEX VOP %zmmM, %zmmM, %zmmN
3974 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
3975 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3976 EVEX VOP %ymmM, %ymmM, %ymmN
3977 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
3978 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3979 VOP, one of vpxord and vpxorq:
3980 EVEX VOP %zmmM, %zmmM, %zmmN
3981 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
3982 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3983 EVEX VOP %ymmM, %ymmM, %ymmN
3984 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
3985 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16)
3986 VOP, one of kxord and kxorq:
3987 VEX VOP %kM, %kM, %kN
3988 -> VEX kxorw %kM, %kM, %kN
3989 VOP, one of kandnd and kandnq:
3990 VEX VOP %kM, %kM, %kN
3991 -> VEX kandnw %kM, %kM, %kN
3992 */
3993 if (is_evex_encoding (&i.tm))
3994 {
3995 if (i.vec_encoding == vex_encoding_evex)
3996 i.tm.opcode_modifier.evex = EVEX128;
3997 else
3998 {
3999 i.tm.opcode_modifier.vex = VEX128;
4000 i.tm.opcode_modifier.vexw = VEXW0;
4001 i.tm.opcode_modifier.evex = 0;
4002 }
4003 }
4004 else if (i.tm.operand_types[0].bitfield.regmask)
4005 {
4006 i.tm.base_opcode &= 0xff;
4007 i.tm.opcode_modifier.vexw = VEXW0;
4008 }
4009 else
4010 i.tm.opcode_modifier.vex = VEX128;
4011
4012 if (i.tm.opcode_modifier.vex)
4013 for (j = 0; j < 3; j++)
4014 {
4015 i.types[j].bitfield.xmmword = 1;
4016 i.types[j].bitfield.ymmword = 0;
4017 }
4018 }
4019 }
4020
4021 /* This is the guts of the machine-dependent assembler. LINE points to a
4022 machine dependent instruction. This function is supposed to emit
4023 the frags/bytes it assembles to. */
4024
4025 void
4026 md_assemble (char *line)
4027 {
4028 unsigned int j;
4029 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4030 const insn_template *t;
4031
4032 /* Initialize globals. */
4033 memset (&i, '\0', sizeof (i));
4034 for (j = 0; j < MAX_OPERANDS; j++)
4035 i.reloc[j] = NO_RELOC;
4036 memset (disp_expressions, '\0', sizeof (disp_expressions));
4037 memset (im_expressions, '\0', sizeof (im_expressions));
4038 save_stack_p = save_stack;
4039
4040 /* First parse an instruction mnemonic & call i386_operand for the operands.
4041 We assume that the scrubber has arranged it so that line[0] is the valid
4042 start of a (possibly prefixed) mnemonic. */
4043
4044 line = parse_insn (line, mnemonic);
4045 if (line == NULL)
4046 return;
4047 mnem_suffix = i.suffix;
4048
4049 line = parse_operands (line, mnemonic);
4050 this_operand = -1;
4051 xfree (i.memop1_string);
4052 i.memop1_string = NULL;
4053 if (line == NULL)
4054 return;
4055
4056 /* Now we've parsed the mnemonic into a set of templates, and have the
4057 operands at hand. */
4058
4059 /* All intel opcodes have reversed operands except for "bound" and
4060 "enter". We also don't reverse intersegment "jmp" and "call"
4061 instructions with 2 immediate operands so that the immediate segment
4062 precedes the offset, as it does when in AT&T mode. */
4063 if (intel_syntax
4064 && i.operands > 1
4065 && (strcmp (mnemonic, "bound") != 0)
4066 && (strcmp (mnemonic, "invlpga") != 0)
4067 && !(operand_type_check (i.types[0], imm)
4068 && operand_type_check (i.types[1], imm)))
4069 swap_operands ();
4070
4071 /* The order of the immediates should be reversed
4072 for 2 immediates extrq and insertq instructions */
4073 if (i.imm_operands == 2
4074 && (strcmp (mnemonic, "extrq") == 0
4075 || strcmp (mnemonic, "insertq") == 0))
4076 swap_2_operands (0, 1);
4077
4078 if (i.imm_operands)
4079 optimize_imm ();
4080
4081 /* Don't optimize displacement for movabs since it only takes 64bit
4082 displacement. */
4083 if (i.disp_operands
4084 && i.disp_encoding != disp_encoding_32bit
4085 && (flag_code != CODE_64BIT
4086 || strcmp (mnemonic, "movabs") != 0))
4087 optimize_disp ();
4088
4089 /* Next, we find a template that matches the given insn,
4090 making sure the overlap of the given operands types is consistent
4091 with the template operand types. */
4092
4093 if (!(t = match_template (mnem_suffix)))
4094 return;
4095
4096 if (sse_check != check_none
4097 && !i.tm.opcode_modifier.noavx
4098 && !i.tm.cpu_flags.bitfield.cpuavx
4099 && (i.tm.cpu_flags.bitfield.cpusse
4100 || i.tm.cpu_flags.bitfield.cpusse2
4101 || i.tm.cpu_flags.bitfield.cpusse3
4102 || i.tm.cpu_flags.bitfield.cpussse3
4103 || i.tm.cpu_flags.bitfield.cpusse4_1
4104 || i.tm.cpu_flags.bitfield.cpusse4_2
4105 || i.tm.cpu_flags.bitfield.cpupclmul
4106 || i.tm.cpu_flags.bitfield.cpuaes
4107 || i.tm.cpu_flags.bitfield.cpugfni))
4108 {
4109 (sse_check == check_warning
4110 ? as_warn
4111 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4112 }
4113
4114 /* Zap movzx and movsx suffix. The suffix has been set from
4115 "word ptr" or "byte ptr" on the source operand in Intel syntax
4116 or extracted from mnemonic in AT&T syntax. But we'll use
4117 the destination register to choose the suffix for encoding. */
4118 if ((i.tm.base_opcode & ~9) == 0x0fb6)
4119 {
4120 /* In Intel syntax, there must be a suffix. In AT&T syntax, if
4121 there is no suffix, the default will be byte extension. */
4122 if (i.reg_operands != 2
4123 && !i.suffix
4124 && intel_syntax)
4125 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
4126
4127 i.suffix = 0;
4128 }
4129
4130 if (i.tm.opcode_modifier.fwait)
4131 if (!add_prefix (FWAIT_OPCODE))
4132 return;
4133
4134 /* Check if REP prefix is OK. */
4135 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4136 {
4137 as_bad (_("invalid instruction `%s' after `%s'"),
4138 i.tm.name, i.rep_prefix);
4139 return;
4140 }
4141
4142 /* Check for lock without a lockable instruction. Destination operand
4143 must be memory unless it is xchg (0x86). */
4144 if (i.prefix[LOCK_PREFIX]
4145 && (!i.tm.opcode_modifier.islockable
4146 || i.mem_operands == 0
4147 || (i.tm.base_opcode != 0x86
4148 && !operand_type_check (i.types[i.operands - 1], anymem))))
4149 {
4150 as_bad (_("expecting lockable instruction after `lock'"));
4151 return;
4152 }
4153
4154 /* Check for data size prefix on VEX/XOP/EVEX encoded insns. */
4155 if (i.prefix[DATA_PREFIX] && is_any_vex_encoding (&i.tm))
4156 {
4157 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4158 return;
4159 }
4160
4161 /* Check if HLE prefix is OK. */
4162 if (i.hle_prefix && !check_hle ())
4163 return;
4164
4165 /* Check BND prefix. */
4166 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4167 as_bad (_("expecting valid branch instruction after `bnd'"));
4168
4169 /* Check NOTRACK prefix. */
4170 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4171 as_bad (_("expecting indirect branch instruction after `notrack'"));
4172
4173 if (i.tm.cpu_flags.bitfield.cpumpx)
4174 {
4175 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4176 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4177 else if (flag_code != CODE_16BIT
4178 ? i.prefix[ADDR_PREFIX]
4179 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4180 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4181 }
4182
4183 /* Insert BND prefix. */
4184 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4185 {
4186 if (!i.prefix[BND_PREFIX])
4187 add_prefix (BND_PREFIX_OPCODE);
4188 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4189 {
4190 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4191 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4192 }
4193 }
4194
4195 /* Check string instruction segment overrides. */
4196 if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
4197 {
4198 if (!check_string ())
4199 return;
4200 i.disp_operands = 0;
4201 }
4202
4203 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4204 optimize_encoding ();
4205
4206 if (!process_suffix ())
4207 return;
4208
4209 /* Update operand types. */
4210 for (j = 0; j < i.operands; j++)
4211 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4212
4213 /* Make still unresolved immediate matches conform to size of immediate
4214 given in i.suffix. */
4215 if (!finalize_imm ())
4216 return;
4217
4218 if (i.types[0].bitfield.imm1)
4219 i.imm_operands = 0; /* kludge for shift insns. */
4220
4221 /* We only need to check those implicit registers for instructions
4222 with 3 operands or less. */
4223 if (i.operands <= 3)
4224 for (j = 0; j < i.operands; j++)
4225 if (i.types[j].bitfield.inoutportreg
4226 || i.types[j].bitfield.shiftcount
4227 || (i.types[j].bitfield.acc && !i.types[j].bitfield.xmmword))
4228 i.reg_operands--;
4229
4230 /* ImmExt should be processed after SSE2AVX. */
4231 if (!i.tm.opcode_modifier.sse2avx
4232 && i.tm.opcode_modifier.immext)
4233 process_immext ();
4234
4235 /* For insns with operands there are more diddles to do to the opcode. */
4236 if (i.operands)
4237 {
4238 if (!process_operands ())
4239 return;
4240 }
4241 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4242 {
4243 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4244 as_warn (_("translating to `%sp'"), i.tm.name);
4245 }
4246
4247 if (is_any_vex_encoding (&i.tm))
4248 {
4249 if (flag_code == CODE_16BIT)
4250 {
4251 as_bad (_("instruction `%s' isn't supported in 16-bit mode."),
4252 i.tm.name);
4253 return;
4254 }
4255
4256 if (i.tm.opcode_modifier.vex)
4257 build_vex_prefix (t);
4258 else
4259 build_evex_prefix ();
4260 }
4261
4262 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4263 instructions may define INT_OPCODE as well, so avoid this corner
4264 case for those instructions that use MODRM. */
4265 if (i.tm.base_opcode == INT_OPCODE
4266 && !i.tm.opcode_modifier.modrm
4267 && i.op[0].imms->X_add_number == 3)
4268 {
4269 i.tm.base_opcode = INT3_OPCODE;
4270 i.imm_operands = 0;
4271 }
4272
4273 if ((i.tm.opcode_modifier.jump
4274 || i.tm.opcode_modifier.jumpbyte
4275 || i.tm.opcode_modifier.jumpdword)
4276 && i.op[0].disps->X_op == O_constant)
4277 {
4278 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4279 the absolute address given by the constant. Since ix86 jumps and
4280 calls are pc relative, we need to generate a reloc. */
4281 i.op[0].disps->X_add_symbol = &abs_symbol;
4282 i.op[0].disps->X_op = O_symbol;
4283 }
4284
4285 if (i.tm.opcode_modifier.rex64)
4286 i.rex |= REX_W;
4287
4288 /* For 8 bit registers we need an empty rex prefix. Also if the
4289 instruction already has a prefix, we need to convert old
4290 registers to new ones. */
4291
4292 if ((i.types[0].bitfield.reg && i.types[0].bitfield.byte
4293 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4294 || (i.types[1].bitfield.reg && i.types[1].bitfield.byte
4295 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4296 || (((i.types[0].bitfield.reg && i.types[0].bitfield.byte)
4297 || (i.types[1].bitfield.reg && i.types[1].bitfield.byte))
4298 && i.rex != 0))
4299 {
4300 int x;
4301
4302 i.rex |= REX_OPCODE;
4303 for (x = 0; x < 2; x++)
4304 {
4305 /* Look for 8 bit operand that uses old registers. */
4306 if (i.types[x].bitfield.reg && i.types[x].bitfield.byte
4307 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4308 {
4309 /* In case it is "hi" register, give up. */
4310 if (i.op[x].regs->reg_num > 3)
4311 as_bad (_("can't encode register '%s%s' in an "
4312 "instruction requiring REX prefix."),
4313 register_prefix, i.op[x].regs->reg_name);
4314
4315 /* Otherwise it is equivalent to the extended register.
4316 Since the encoding doesn't change this is merely
4317 cosmetic cleanup for debug output. */
4318
4319 i.op[x].regs = i.op[x].regs + 8;
4320 }
4321 }
4322 }
4323
4324 if (i.rex == 0 && i.rex_encoding)
4325 {
4326 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4327 that uses legacy register. If it is "hi" register, don't add
4328 the REX_OPCODE byte. */
4329 int x;
4330 for (x = 0; x < 2; x++)
4331 if (i.types[x].bitfield.reg
4332 && i.types[x].bitfield.byte
4333 && (i.op[x].regs->reg_flags & RegRex64) == 0
4334 && i.op[x].regs->reg_num > 3)
4335 {
4336 i.rex_encoding = FALSE;
4337 break;
4338 }
4339
4340 if (i.rex_encoding)
4341 i.rex = REX_OPCODE;
4342 }
4343
4344 if (i.rex != 0)
4345 add_prefix (REX_OPCODE | i.rex);
4346
4347 /* We are ready to output the insn. */
4348 output_insn ();
4349 }
4350
4351 static char *
4352 parse_insn (char *line, char *mnemonic)
4353 {
4354 char *l = line;
4355 char *token_start = l;
4356 char *mnem_p;
4357 int supported;
4358 const insn_template *t;
4359 char *dot_p = NULL;
4360
4361 while (1)
4362 {
4363 mnem_p = mnemonic;
4364 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
4365 {
4366 if (*mnem_p == '.')
4367 dot_p = mnem_p;
4368 mnem_p++;
4369 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
4370 {
4371 as_bad (_("no such instruction: `%s'"), token_start);
4372 return NULL;
4373 }
4374 l++;
4375 }
4376 if (!is_space_char (*l)
4377 && *l != END_OF_INSN
4378 && (intel_syntax
4379 || (*l != PREFIX_SEPARATOR
4380 && *l != ',')))
4381 {
4382 as_bad (_("invalid character %s in mnemonic"),
4383 output_invalid (*l));
4384 return NULL;
4385 }
4386 if (token_start == l)
4387 {
4388 if (!intel_syntax && *l == PREFIX_SEPARATOR)
4389 as_bad (_("expecting prefix; got nothing"));
4390 else
4391 as_bad (_("expecting mnemonic; got nothing"));
4392 return NULL;
4393 }
4394
4395 /* Look up instruction (or prefix) via hash table. */
4396 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4397
4398 if (*l != END_OF_INSN
4399 && (!is_space_char (*l) || l[1] != END_OF_INSN)
4400 && current_templates
4401 && current_templates->start->opcode_modifier.isprefix)
4402 {
4403 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
4404 {
4405 as_bad ((flag_code != CODE_64BIT
4406 ? _("`%s' is only supported in 64-bit mode")
4407 : _("`%s' is not supported in 64-bit mode")),
4408 current_templates->start->name);
4409 return NULL;
4410 }
4411 /* If we are in 16-bit mode, do not allow addr16 or data16.
4412 Similarly, in 32-bit mode, do not allow addr32 or data32. */
4413 if ((current_templates->start->opcode_modifier.size16
4414 || current_templates->start->opcode_modifier.size32)
4415 && flag_code != CODE_64BIT
4416 && (current_templates->start->opcode_modifier.size32
4417 ^ (flag_code == CODE_16BIT)))
4418 {
4419 as_bad (_("redundant %s prefix"),
4420 current_templates->start->name);
4421 return NULL;
4422 }
4423 if (current_templates->start->opcode_length == 0)
4424 {
4425 /* Handle pseudo prefixes. */
4426 switch (current_templates->start->base_opcode)
4427 {
4428 case 0x0:
4429 /* {disp8} */
4430 i.disp_encoding = disp_encoding_8bit;
4431 break;
4432 case 0x1:
4433 /* {disp32} */
4434 i.disp_encoding = disp_encoding_32bit;
4435 break;
4436 case 0x2:
4437 /* {load} */
4438 i.dir_encoding = dir_encoding_load;
4439 break;
4440 case 0x3:
4441 /* {store} */
4442 i.dir_encoding = dir_encoding_store;
4443 break;
4444 case 0x4:
4445 /* {vex2} */
4446 i.vec_encoding = vex_encoding_vex2;
4447 break;
4448 case 0x5:
4449 /* {vex3} */
4450 i.vec_encoding = vex_encoding_vex3;
4451 break;
4452 case 0x6:
4453 /* {evex} */
4454 i.vec_encoding = vex_encoding_evex;
4455 break;
4456 case 0x7:
4457 /* {rex} */
4458 i.rex_encoding = TRUE;
4459 break;
4460 case 0x8:
4461 /* {nooptimize} */
4462 i.no_optimize = TRUE;
4463 break;
4464 default:
4465 abort ();
4466 }
4467 }
4468 else
4469 {
4470 /* Add prefix, checking for repeated prefixes. */
4471 switch (add_prefix (current_templates->start->base_opcode))
4472 {
4473 case PREFIX_EXIST:
4474 return NULL;
4475 case PREFIX_DS:
4476 if (current_templates->start->cpu_flags.bitfield.cpuibt)
4477 i.notrack_prefix = current_templates->start->name;
4478 break;
4479 case PREFIX_REP:
4480 if (current_templates->start->cpu_flags.bitfield.cpuhle)
4481 i.hle_prefix = current_templates->start->name;
4482 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
4483 i.bnd_prefix = current_templates->start->name;
4484 else
4485 i.rep_prefix = current_templates->start->name;
4486 break;
4487 default:
4488 break;
4489 }
4490 }
4491 /* Skip past PREFIX_SEPARATOR and reset token_start. */
4492 token_start = ++l;
4493 }
4494 else
4495 break;
4496 }
4497
4498 if (!current_templates)
4499 {
4500 /* Check if we should swap operand or force 32bit displacement in
4501 encoding. */
4502 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
4503 i.dir_encoding = dir_encoding_store;
4504 else if (mnem_p - 3 == dot_p
4505 && dot_p[1] == 'd'
4506 && dot_p[2] == '8')
4507 i.disp_encoding = disp_encoding_8bit;
4508 else if (mnem_p - 4 == dot_p
4509 && dot_p[1] == 'd'
4510 && dot_p[2] == '3'
4511 && dot_p[3] == '2')
4512 i.disp_encoding = disp_encoding_32bit;
4513 else
4514 goto check_suffix;
4515 mnem_p = dot_p;
4516 *dot_p = '\0';
4517 current_templates = (const templates *) hash_find (op_hash, mnemonic);
4518 }
4519
4520 if (!current_templates)
4521 {
4522 check_suffix:
4523 /* See if we can get a match by trimming off a suffix. */
4524 switch (mnem_p[-1])
4525 {
4526 case WORD_MNEM_SUFFIX:
4527 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
4528 i.suffix = SHORT_MNEM_SUFFIX;
4529 else
4530 /* Fall through. */
4531 case BYTE_MNEM_SUFFIX:
4532 case QWORD_MNEM_SUFFIX:
4533 i.suffix = mnem_p[-1];
4534 mnem_p[-1] = '\0';
4535 current_templates = (const templates *) hash_find (op_hash,
4536 mnemonic);
4537 break;
4538 case SHORT_MNEM_SUFFIX:
4539 case LONG_MNEM_SUFFIX:
4540 if (!intel_syntax)
4541 {
4542 i.suffix = mnem_p[-1];
4543 mnem_p[-1] = '\0';
4544 current_templates = (const templates *) hash_find (op_hash,
4545 mnemonic);
4546 }
4547 break;
4548
4549 /* Intel Syntax. */
4550 case 'd':
4551 if (intel_syntax)
4552 {
4553 if (intel_float_operand (mnemonic) == 1)
4554 i.suffix = SHORT_MNEM_SUFFIX;
4555 else
4556 i.suffix = LONG_MNEM_SUFFIX;
4557 mnem_p[-1] = '\0';
4558 current_templates = (const templates *) hash_find (op_hash,
4559 mnemonic);
4560 }
4561 break;
4562 }
4563 if (!current_templates)
4564 {
4565 as_bad (_("no such instruction: `%s'"), token_start);
4566 return NULL;
4567 }
4568 }
4569
4570 if (current_templates->start->opcode_modifier.jump
4571 || current_templates->start->opcode_modifier.jumpbyte)
4572 {
4573 /* Check for a branch hint. We allow ",pt" and ",pn" for
4574 predict taken and predict not taken respectively.
4575 I'm not sure that branch hints actually do anything on loop
4576 and jcxz insns (JumpByte) for current Pentium4 chips. They
4577 may work in the future and it doesn't hurt to accept them
4578 now. */
4579 if (l[0] == ',' && l[1] == 'p')
4580 {
4581 if (l[2] == 't')
4582 {
4583 if (!add_prefix (DS_PREFIX_OPCODE))
4584 return NULL;
4585 l += 3;
4586 }
4587 else if (l[2] == 'n')
4588 {
4589 if (!add_prefix (CS_PREFIX_OPCODE))
4590 return NULL;
4591 l += 3;
4592 }
4593 }
4594 }
4595 /* Any other comma loses. */
4596 if (*l == ',')
4597 {
4598 as_bad (_("invalid character %s in mnemonic"),
4599 output_invalid (*l));
4600 return NULL;
4601 }
4602
4603 /* Check if instruction is supported on specified architecture. */
4604 supported = 0;
4605 for (t = current_templates->start; t < current_templates->end; ++t)
4606 {
4607 supported |= cpu_flags_match (t);
4608 if (supported == CPU_FLAGS_PERFECT_MATCH)
4609 {
4610 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
4611 as_warn (_("use .code16 to ensure correct addressing mode"));
4612
4613 return l;
4614 }
4615 }
4616
4617 if (!(supported & CPU_FLAGS_64BIT_MATCH))
4618 as_bad (flag_code == CODE_64BIT
4619 ? _("`%s' is not supported in 64-bit mode")
4620 : _("`%s' is only supported in 64-bit mode"),
4621 current_templates->start->name);
4622 else
4623 as_bad (_("`%s' is not supported on `%s%s'"),
4624 current_templates->start->name,
4625 cpu_arch_name ? cpu_arch_name : default_arch,
4626 cpu_sub_arch_name ? cpu_sub_arch_name : "");
4627
4628 return NULL;
4629 }
4630
4631 static char *
4632 parse_operands (char *l, const char *mnemonic)
4633 {
4634 char *token_start;
4635
4636 /* 1 if operand is pending after ','. */
4637 unsigned int expecting_operand = 0;
4638
4639 /* Non-zero if operand parens not balanced. */
4640 unsigned int paren_not_balanced;
4641
4642 while (*l != END_OF_INSN)
4643 {
4644 /* Skip optional white space before operand. */
4645 if (is_space_char (*l))
4646 ++l;
4647 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
4648 {
4649 as_bad (_("invalid character %s before operand %d"),
4650 output_invalid (*l),
4651 i.operands + 1);
4652 return NULL;
4653 }
4654 token_start = l; /* After white space. */
4655 paren_not_balanced = 0;
4656 while (paren_not_balanced || *l != ',')
4657 {
4658 if (*l == END_OF_INSN)
4659 {
4660 if (paren_not_balanced)
4661 {
4662 if (!intel_syntax)
4663 as_bad (_("unbalanced parenthesis in operand %d."),
4664 i.operands + 1);
4665 else
4666 as_bad (_("unbalanced brackets in operand %d."),
4667 i.operands + 1);
4668 return NULL;
4669 }
4670 else
4671 break; /* we are done */
4672 }
4673 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4674 {
4675 as_bad (_("invalid character %s in operand %d"),
4676 output_invalid (*l),
4677 i.operands + 1);
4678 return NULL;
4679 }
4680 if (!intel_syntax)
4681 {
4682 if (*l == '(')
4683 ++paren_not_balanced;
4684 if (*l == ')')
4685 --paren_not_balanced;
4686 }
4687 else
4688 {
4689 if (*l == '[')
4690 ++paren_not_balanced;
4691 if (*l == ']')
4692 --paren_not_balanced;
4693 }
4694 l++;
4695 }
4696 if (l != token_start)
4697 { /* Yes, we've read in another operand. */
4698 unsigned int operand_ok;
4699 this_operand = i.operands++;
4700 if (i.operands > MAX_OPERANDS)
4701 {
4702 as_bad (_("spurious operands; (%d operands/instruction max)"),
4703 MAX_OPERANDS);
4704 return NULL;
4705 }
4706 i.types[this_operand].bitfield.unspecified = 1;
4707 /* Now parse operand adding info to 'i' as we go along. */
4708 END_STRING_AND_SAVE (l);
4709
4710 if (i.mem_operands > 1)
4711 {
4712 as_bad (_("too many memory references for `%s'"),
4713 mnemonic);
4714 return 0;
4715 }
4716
4717 if (intel_syntax)
4718 operand_ok =
4719 i386_intel_operand (token_start,
4720 intel_float_operand (mnemonic));
4721 else
4722 operand_ok = i386_att_operand (token_start);
4723
4724 RESTORE_END_STRING (l);
4725 if (!operand_ok)
4726 return NULL;
4727 }
4728 else
4729 {
4730 if (expecting_operand)
4731 {
4732 expecting_operand_after_comma:
4733 as_bad (_("expecting operand after ','; got nothing"));
4734 return NULL;
4735 }
4736 if (*l == ',')
4737 {
4738 as_bad (_("expecting operand before ','; got nothing"));
4739 return NULL;
4740 }
4741 }
4742
4743 /* Now *l must be either ',' or END_OF_INSN. */
4744 if (*l == ',')
4745 {
4746 if (*++l == END_OF_INSN)
4747 {
4748 /* Just skip it, if it's \n complain. */
4749 goto expecting_operand_after_comma;
4750 }
4751 expecting_operand = 1;
4752 }
4753 }
4754 return l;
4755 }
4756
4757 static void
4758 swap_2_operands (int xchg1, int xchg2)
4759 {
4760 union i386_op temp_op;
4761 i386_operand_type temp_type;
4762 unsigned int temp_flags;
4763 enum bfd_reloc_code_real temp_reloc;
4764
4765 temp_type = i.types[xchg2];
4766 i.types[xchg2] = i.types[xchg1];
4767 i.types[xchg1] = temp_type;
4768
4769 temp_flags = i.flags[xchg2];
4770 i.flags[xchg2] = i.flags[xchg1];
4771 i.flags[xchg1] = temp_flags;
4772
4773 temp_op = i.op[xchg2];
4774 i.op[xchg2] = i.op[xchg1];
4775 i.op[xchg1] = temp_op;
4776
4777 temp_reloc = i.reloc[xchg2];
4778 i.reloc[xchg2] = i.reloc[xchg1];
4779 i.reloc[xchg1] = temp_reloc;
4780
4781 if (i.mask)
4782 {
4783 if (i.mask->operand == xchg1)
4784 i.mask->operand = xchg2;
4785 else if (i.mask->operand == xchg2)
4786 i.mask->operand = xchg1;
4787 }
4788 if (i.broadcast)
4789 {
4790 if (i.broadcast->operand == xchg1)
4791 i.broadcast->operand = xchg2;
4792 else if (i.broadcast->operand == xchg2)
4793 i.broadcast->operand = xchg1;
4794 }
4795 if (i.rounding)
4796 {
4797 if (i.rounding->operand == xchg1)
4798 i.rounding->operand = xchg2;
4799 else if (i.rounding->operand == xchg2)
4800 i.rounding->operand = xchg1;
4801 }
4802 }
4803
4804 static void
4805 swap_operands (void)
4806 {
4807 switch (i.operands)
4808 {
4809 case 5:
4810 case 4:
4811 swap_2_operands (1, i.operands - 2);
4812 /* Fall through. */
4813 case 3:
4814 case 2:
4815 swap_2_operands (0, i.operands - 1);
4816 break;
4817 default:
4818 abort ();
4819 }
4820
4821 if (i.mem_operands == 2)
4822 {
4823 const seg_entry *temp_seg;
4824 temp_seg = i.seg[0];
4825 i.seg[0] = i.seg[1];
4826 i.seg[1] = temp_seg;
4827 }
4828 }
4829
4830 /* Try to ensure constant immediates are represented in the smallest
4831 opcode possible. */
4832 static void
4833 optimize_imm (void)
4834 {
4835 char guess_suffix = 0;
4836 int op;
4837
4838 if (i.suffix)
4839 guess_suffix = i.suffix;
4840 else if (i.reg_operands)
4841 {
4842 /* Figure out a suffix from the last register operand specified.
4843 We can't do this properly yet, ie. excluding InOutPortReg,
4844 but the following works for instructions with immediates.
4845 In any case, we can't set i.suffix yet. */
4846 for (op = i.operands; --op >= 0;)
4847 if (i.types[op].bitfield.reg && i.types[op].bitfield.byte)
4848 {
4849 guess_suffix = BYTE_MNEM_SUFFIX;
4850 break;
4851 }
4852 else if (i.types[op].bitfield.reg && i.types[op].bitfield.word)
4853 {
4854 guess_suffix = WORD_MNEM_SUFFIX;
4855 break;
4856 }
4857 else if (i.types[op].bitfield.reg && i.types[op].bitfield.dword)
4858 {
4859 guess_suffix = LONG_MNEM_SUFFIX;
4860 break;
4861 }
4862 else if (i.types[op].bitfield.reg && i.types[op].bitfield.qword)
4863 {
4864 guess_suffix = QWORD_MNEM_SUFFIX;
4865 break;
4866 }
4867 }
4868 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
4869 guess_suffix = WORD_MNEM_SUFFIX;
4870
4871 for (op = i.operands; --op >= 0;)
4872 if (operand_type_check (i.types[op], imm))
4873 {
4874 switch (i.op[op].imms->X_op)
4875 {
4876 case O_constant:
4877 /* If a suffix is given, this operand may be shortened. */
4878 switch (guess_suffix)
4879 {
4880 case LONG_MNEM_SUFFIX:
4881 i.types[op].bitfield.imm32 = 1;
4882 i.types[op].bitfield.imm64 = 1;
4883 break;
4884 case WORD_MNEM_SUFFIX:
4885 i.types[op].bitfield.imm16 = 1;
4886 i.types[op].bitfield.imm32 = 1;
4887 i.types[op].bitfield.imm32s = 1;
4888 i.types[op].bitfield.imm64 = 1;
4889 break;
4890 case BYTE_MNEM_SUFFIX:
4891 i.types[op].bitfield.imm8 = 1;
4892 i.types[op].bitfield.imm8s = 1;
4893 i.types[op].bitfield.imm16 = 1;
4894 i.types[op].bitfield.imm32 = 1;
4895 i.types[op].bitfield.imm32s = 1;
4896 i.types[op].bitfield.imm64 = 1;
4897 break;
4898 }
4899
4900 /* If this operand is at most 16 bits, convert it
4901 to a signed 16 bit number before trying to see
4902 whether it will fit in an even smaller size.
4903 This allows a 16-bit operand such as $0xffe0 to
4904 be recognised as within Imm8S range. */
4905 if ((i.types[op].bitfield.imm16)
4906 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
4907 {
4908 i.op[op].imms->X_add_number =
4909 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
4910 }
4911 #ifdef BFD64
4912 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
4913 if ((i.types[op].bitfield.imm32)
4914 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
4915 == 0))
4916 {
4917 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
4918 ^ ((offsetT) 1 << 31))
4919 - ((offsetT) 1 << 31));
4920 }
4921 #endif
4922 i.types[op]
4923 = operand_type_or (i.types[op],
4924 smallest_imm_type (i.op[op].imms->X_add_number));
4925
4926 /* We must avoid matching of Imm32 templates when 64bit
4927 only immediate is available. */
4928 if (guess_suffix == QWORD_MNEM_SUFFIX)
4929 i.types[op].bitfield.imm32 = 0;
4930 break;
4931
4932 case O_absent:
4933 case O_register:
4934 abort ();
4935
4936 /* Symbols and expressions. */
4937 default:
4938 /* Convert symbolic operand to proper sizes for matching, but don't
4939 prevent matching a set of insns that only supports sizes other
4940 than those matching the insn suffix. */
4941 {
4942 i386_operand_type mask, allowed;
4943 const insn_template *t;
4944
4945 operand_type_set (&mask, 0);
4946 operand_type_set (&allowed, 0);
4947
4948 for (t = current_templates->start;
4949 t < current_templates->end;
4950 ++t)
4951 allowed = operand_type_or (allowed,
4952 t->operand_types[op]);
4953 switch (guess_suffix)
4954 {
4955 case QWORD_MNEM_SUFFIX:
4956 mask.bitfield.imm64 = 1;
4957 mask.bitfield.imm32s = 1;
4958 break;
4959 case LONG_MNEM_SUFFIX:
4960 mask.bitfield.imm32 = 1;
4961 break;
4962 case WORD_MNEM_SUFFIX:
4963 mask.bitfield.imm16 = 1;
4964 break;
4965 case BYTE_MNEM_SUFFIX:
4966 mask.bitfield.imm8 = 1;
4967 break;
4968 default:
4969 break;
4970 }
4971 allowed = operand_type_and (mask, allowed);
4972 if (!operand_type_all_zero (&allowed))
4973 i.types[op] = operand_type_and (i.types[op], mask);
4974 }
4975 break;
4976 }
4977 }
4978 }
4979
4980 /* Try to use the smallest displacement type too. */
4981 static void
4982 optimize_disp (void)
4983 {
4984 int op;
4985
4986 for (op = i.operands; --op >= 0;)
4987 if (operand_type_check (i.types[op], disp))
4988 {
4989 if (i.op[op].disps->X_op == O_constant)
4990 {
4991 offsetT op_disp = i.op[op].disps->X_add_number;
4992
4993 if (i.types[op].bitfield.disp16
4994 && (op_disp & ~(offsetT) 0xffff) == 0)
4995 {
4996 /* If this operand is at most 16 bits, convert
4997 to a signed 16 bit number and don't use 64bit
4998 displacement. */
4999 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5000 i.types[op].bitfield.disp64 = 0;
5001 }
5002 #ifdef BFD64
5003 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5004 if (i.types[op].bitfield.disp32
5005 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5006 {
5007 /* If this operand is at most 32 bits, convert
5008 to a signed 32 bit number and don't use 64bit
5009 displacement. */
5010 op_disp &= (((offsetT) 2 << 31) - 1);
5011 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5012 i.types[op].bitfield.disp64 = 0;
5013 }
5014 #endif
5015 if (!op_disp && i.types[op].bitfield.baseindex)
5016 {
5017 i.types[op].bitfield.disp8 = 0;
5018 i.types[op].bitfield.disp16 = 0;
5019 i.types[op].bitfield.disp32 = 0;
5020 i.types[op].bitfield.disp32s = 0;
5021 i.types[op].bitfield.disp64 = 0;
5022 i.op[op].disps = 0;
5023 i.disp_operands--;
5024 }
5025 else if (flag_code == CODE_64BIT)
5026 {
5027 if (fits_in_signed_long (op_disp))
5028 {
5029 i.types[op].bitfield.disp64 = 0;
5030 i.types[op].bitfield.disp32s = 1;
5031 }
5032 if (i.prefix[ADDR_PREFIX]
5033 && fits_in_unsigned_long (op_disp))
5034 i.types[op].bitfield.disp32 = 1;
5035 }
5036 if ((i.types[op].bitfield.disp32
5037 || i.types[op].bitfield.disp32s
5038 || i.types[op].bitfield.disp16)
5039 && fits_in_disp8 (op_disp))
5040 i.types[op].bitfield.disp8 = 1;
5041 }
5042 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5043 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5044 {
5045 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5046 i.op[op].disps, 0, i.reloc[op]);
5047 i.types[op].bitfield.disp8 = 0;
5048 i.types[op].bitfield.disp16 = 0;
5049 i.types[op].bitfield.disp32 = 0;
5050 i.types[op].bitfield.disp32s = 0;
5051 i.types[op].bitfield.disp64 = 0;
5052 }
5053 else
5054 /* We only support 64bit displacement on constants. */
5055 i.types[op].bitfield.disp64 = 0;
5056 }
5057 }
5058
5059 /* Return 1 if there is a match in broadcast bytes between operand
5060 GIVEN and instruction template T. */
5061
5062 static INLINE int
5063 match_broadcast_size (const insn_template *t, unsigned int given)
5064 {
5065 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5066 && i.types[given].bitfield.byte)
5067 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5068 && i.types[given].bitfield.word)
5069 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5070 && i.types[given].bitfield.dword)
5071 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5072 && i.types[given].bitfield.qword));
5073 }
5074
5075 /* Check if operands are valid for the instruction. */
5076
5077 static int
5078 check_VecOperands (const insn_template *t)
5079 {
5080 unsigned int op;
5081 i386_cpu_flags cpu;
5082 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
5083
5084 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5085 any one operand are implicity requiring AVX512VL support if the actual
5086 operand size is YMMword or XMMword. Since this function runs after
5087 template matching, there's no need to check for YMMword/XMMword in
5088 the template. */
5089 cpu = cpu_flags_and (t->cpu_flags, avx512);
5090 if (!cpu_flags_all_zero (&cpu)
5091 && !t->cpu_flags.bitfield.cpuavx512vl
5092 && !cpu_arch_flags.bitfield.cpuavx512vl)
5093 {
5094 for (op = 0; op < t->operands; ++op)
5095 {
5096 if (t->operand_types[op].bitfield.zmmword
5097 && (i.types[op].bitfield.ymmword
5098 || i.types[op].bitfield.xmmword))
5099 {
5100 i.error = unsupported;
5101 return 1;
5102 }
5103 }
5104 }
5105
5106 /* Without VSIB byte, we can't have a vector register for index. */
5107 if (!t->opcode_modifier.vecsib
5108 && i.index_reg
5109 && (i.index_reg->reg_type.bitfield.xmmword
5110 || i.index_reg->reg_type.bitfield.ymmword
5111 || i.index_reg->reg_type.bitfield.zmmword))
5112 {
5113 i.error = unsupported_vector_index_register;
5114 return 1;
5115 }
5116
5117 /* Check if default mask is allowed. */
5118 if (t->opcode_modifier.nodefmask
5119 && (!i.mask || i.mask->mask->reg_num == 0))
5120 {
5121 i.error = no_default_mask;
5122 return 1;
5123 }
5124
5125 /* For VSIB byte, we need a vector register for index, and all vector
5126 registers must be distinct. */
5127 if (t->opcode_modifier.vecsib)
5128 {
5129 if (!i.index_reg
5130 || !((t->opcode_modifier.vecsib == VecSIB128
5131 && i.index_reg->reg_type.bitfield.xmmword)
5132 || (t->opcode_modifier.vecsib == VecSIB256
5133 && i.index_reg->reg_type.bitfield.ymmword)
5134 || (t->opcode_modifier.vecsib == VecSIB512
5135 && i.index_reg->reg_type.bitfield.zmmword)))
5136 {
5137 i.error = invalid_vsib_address;
5138 return 1;
5139 }
5140
5141 gas_assert (i.reg_operands == 2 || i.mask);
5142 if (i.reg_operands == 2 && !i.mask)
5143 {
5144 gas_assert (i.types[0].bitfield.regsimd);
5145 gas_assert (i.types[0].bitfield.xmmword
5146 || i.types[0].bitfield.ymmword);
5147 gas_assert (i.types[2].bitfield.regsimd);
5148 gas_assert (i.types[2].bitfield.xmmword
5149 || i.types[2].bitfield.ymmword);
5150 if (operand_check == check_none)
5151 return 0;
5152 if (register_number (i.op[0].regs)
5153 != register_number (i.index_reg)
5154 && register_number (i.op[2].regs)
5155 != register_number (i.index_reg)
5156 && register_number (i.op[0].regs)
5157 != register_number (i.op[2].regs))
5158 return 0;
5159 if (operand_check == check_error)
5160 {
5161 i.error = invalid_vector_register_set;
5162 return 1;
5163 }
5164 as_warn (_("mask, index, and destination registers should be distinct"));
5165 }
5166 else if (i.reg_operands == 1 && i.mask)
5167 {
5168 if (i.types[1].bitfield.regsimd
5169 && (i.types[1].bitfield.xmmword
5170 || i.types[1].bitfield.ymmword
5171 || i.types[1].bitfield.zmmword)
5172 && (register_number (i.op[1].regs)
5173 == register_number (i.index_reg)))
5174 {
5175 if (operand_check == check_error)
5176 {
5177 i.error = invalid_vector_register_set;
5178 return 1;
5179 }
5180 if (operand_check != check_none)
5181 as_warn (_("index and destination registers should be distinct"));
5182 }
5183 }
5184 }
5185
5186 /* Check if broadcast is supported by the instruction and is applied
5187 to the memory operand. */
5188 if (i.broadcast)
5189 {
5190 i386_operand_type type, overlap;
5191
5192 /* Check if specified broadcast is supported in this instruction,
5193 and its broadcast bytes match the memory operand. */
5194 op = i.broadcast->operand;
5195 if (!t->opcode_modifier.broadcast
5196 || !(i.flags[op] & Operand_Mem)
5197 || (!i.types[op].bitfield.unspecified
5198 && !match_broadcast_size (t, op)))
5199 {
5200 bad_broadcast:
5201 i.error = unsupported_broadcast;
5202 return 1;
5203 }
5204
5205 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5206 * i.broadcast->type);
5207 operand_type_set (&type, 0);
5208 switch (i.broadcast->bytes)
5209 {
5210 case 2:
5211 type.bitfield.word = 1;
5212 break;
5213 case 4:
5214 type.bitfield.dword = 1;
5215 break;
5216 case 8:
5217 type.bitfield.qword = 1;
5218 break;
5219 case 16:
5220 type.bitfield.xmmword = 1;
5221 break;
5222 case 32:
5223 type.bitfield.ymmword = 1;
5224 break;
5225 case 64:
5226 type.bitfield.zmmword = 1;
5227 break;
5228 default:
5229 goto bad_broadcast;
5230 }
5231
5232 overlap = operand_type_and (type, t->operand_types[op]);
5233 if (operand_type_all_zero (&overlap))
5234 goto bad_broadcast;
5235
5236 if (t->opcode_modifier.checkregsize)
5237 {
5238 unsigned int j;
5239
5240 type.bitfield.baseindex = 1;
5241 for (j = 0; j < i.operands; ++j)
5242 {
5243 if (j != op
5244 && !operand_type_register_match(i.types[j],
5245 t->operand_types[j],
5246 type,
5247 t->operand_types[op]))
5248 goto bad_broadcast;
5249 }
5250 }
5251 }
5252 /* If broadcast is supported in this instruction, we need to check if
5253 operand of one-element size isn't specified without broadcast. */
5254 else if (t->opcode_modifier.broadcast && i.mem_operands)
5255 {
5256 /* Find memory operand. */
5257 for (op = 0; op < i.operands; op++)
5258 if (operand_type_check (i.types[op], anymem))
5259 break;
5260 gas_assert (op < i.operands);
5261 /* Check size of the memory operand. */
5262 if (match_broadcast_size (t, op))
5263 {
5264 i.error = broadcast_needed;
5265 return 1;
5266 }
5267 }
5268 else
5269 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5270
5271 /* Check if requested masking is supported. */
5272 if (i.mask)
5273 {
5274 switch (t->opcode_modifier.masking)
5275 {
5276 case BOTH_MASKING:
5277 break;
5278 case MERGING_MASKING:
5279 if (i.mask->zeroing)
5280 {
5281 case 0:
5282 i.error = unsupported_masking;
5283 return 1;
5284 }
5285 break;
5286 case DYNAMIC_MASKING:
5287 /* Memory destinations allow only merging masking. */
5288 if (i.mask->zeroing && i.mem_operands)
5289 {
5290 /* Find memory operand. */
5291 for (op = 0; op < i.operands; op++)
5292 if (i.flags[op] & Operand_Mem)
5293 break;
5294 gas_assert (op < i.operands);
5295 if (op == i.operands - 1)
5296 {
5297 i.error = unsupported_masking;
5298 return 1;
5299 }
5300 }
5301 break;
5302 default:
5303 abort ();
5304 }
5305 }
5306
5307 /* Check if masking is applied to dest operand. */
5308 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
5309 {
5310 i.error = mask_not_on_destination;
5311 return 1;
5312 }
5313
5314 /* Check RC/SAE. */
5315 if (i.rounding)
5316 {
5317 if ((i.rounding->type != saeonly
5318 && !t->opcode_modifier.staticrounding)
5319 || (i.rounding->type == saeonly
5320 && (t->opcode_modifier.staticrounding
5321 || !t->opcode_modifier.sae)))
5322 {
5323 i.error = unsupported_rc_sae;
5324 return 1;
5325 }
5326 /* If the instruction has several immediate operands and one of
5327 them is rounding, the rounding operand should be the last
5328 immediate operand. */
5329 if (i.imm_operands > 1
5330 && i.rounding->operand != (int) (i.imm_operands - 1))
5331 {
5332 i.error = rc_sae_operand_not_last_imm;
5333 return 1;
5334 }
5335 }
5336
5337 /* Check vector Disp8 operand. */
5338 if (t->opcode_modifier.disp8memshift
5339 && i.disp_encoding != disp_encoding_32bit)
5340 {
5341 if (i.broadcast)
5342 i.memshift = t->opcode_modifier.broadcast - 1;
5343 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
5344 i.memshift = t->opcode_modifier.disp8memshift;
5345 else
5346 {
5347 const i386_operand_type *type = NULL;
5348
5349 i.memshift = 0;
5350 for (op = 0; op < i.operands; op++)
5351 if (operand_type_check (i.types[op], anymem))
5352 {
5353 if (t->opcode_modifier.evex == EVEXLIG)
5354 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
5355 else if (t->operand_types[op].bitfield.xmmword
5356 + t->operand_types[op].bitfield.ymmword
5357 + t->operand_types[op].bitfield.zmmword <= 1)
5358 type = &t->operand_types[op];
5359 else if (!i.types[op].bitfield.unspecified)
5360 type = &i.types[op];
5361 }
5362 else if (i.types[op].bitfield.regsimd
5363 && t->opcode_modifier.evex != EVEXLIG)
5364 {
5365 if (i.types[op].bitfield.zmmword)
5366 i.memshift = 6;
5367 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
5368 i.memshift = 5;
5369 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
5370 i.memshift = 4;
5371 }
5372
5373 if (type)
5374 {
5375 if (type->bitfield.zmmword)
5376 i.memshift = 6;
5377 else if (type->bitfield.ymmword)
5378 i.memshift = 5;
5379 else if (type->bitfield.xmmword)
5380 i.memshift = 4;
5381 }
5382
5383 /* For the check in fits_in_disp8(). */
5384 if (i.memshift == 0)
5385 i.memshift = -1;
5386 }
5387
5388 for (op = 0; op < i.operands; op++)
5389 if (operand_type_check (i.types[op], disp)
5390 && i.op[op].disps->X_op == O_constant)
5391 {
5392 if (fits_in_disp8 (i.op[op].disps->X_add_number))
5393 {
5394 i.types[op].bitfield.disp8 = 1;
5395 return 0;
5396 }
5397 i.types[op].bitfield.disp8 = 0;
5398 }
5399 }
5400
5401 i.memshift = 0;
5402
5403 return 0;
5404 }
5405
5406 /* Check if operands are valid for the instruction. Update VEX
5407 operand types. */
5408
5409 static int
5410 VEX_check_operands (const insn_template *t)
5411 {
5412 if (i.vec_encoding == vex_encoding_evex)
5413 {
5414 /* This instruction must be encoded with EVEX prefix. */
5415 if (!is_evex_encoding (t))
5416 {
5417 i.error = unsupported;
5418 return 1;
5419 }
5420 return 0;
5421 }
5422
5423 if (!t->opcode_modifier.vex)
5424 {
5425 /* This instruction template doesn't have VEX prefix. */
5426 if (i.vec_encoding != vex_encoding_default)
5427 {
5428 i.error = unsupported;
5429 return 1;
5430 }
5431 return 0;
5432 }
5433
5434 /* Only check VEX_Imm4, which must be the first operand. */
5435 if (t->operand_types[0].bitfield.vec_imm4)
5436 {
5437 if (i.op[0].imms->X_op != O_constant
5438 || !fits_in_imm4 (i.op[0].imms->X_add_number))
5439 {
5440 i.error = bad_imm4;
5441 return 1;
5442 }
5443
5444 /* Turn off Imm8 so that update_imm won't complain. */
5445 i.types[0] = vec_imm4;
5446 }
5447
5448 return 0;
5449 }
5450
5451 static const insn_template *
5452 match_template (char mnem_suffix)
5453 {
5454 /* Points to template once we've found it. */
5455 const insn_template *t;
5456 i386_operand_type overlap0, overlap1, overlap2, overlap3;
5457 i386_operand_type overlap4;
5458 unsigned int found_reverse_match;
5459 i386_opcode_modifier suffix_check, mnemsuf_check;
5460 i386_operand_type operand_types [MAX_OPERANDS];
5461 int addr_prefix_disp;
5462 unsigned int j;
5463 unsigned int found_cpu_match, size_match;
5464 unsigned int check_register;
5465 enum i386_error specific_error = 0;
5466
5467 #if MAX_OPERANDS != 5
5468 # error "MAX_OPERANDS must be 5."
5469 #endif
5470
5471 found_reverse_match = 0;
5472 addr_prefix_disp = -1;
5473
5474 memset (&suffix_check, 0, sizeof (suffix_check));
5475 if (intel_syntax && i.broadcast)
5476 /* nothing */;
5477 else if (i.suffix == BYTE_MNEM_SUFFIX)
5478 suffix_check.no_bsuf = 1;
5479 else if (i.suffix == WORD_MNEM_SUFFIX)
5480 suffix_check.no_wsuf = 1;
5481 else if (i.suffix == SHORT_MNEM_SUFFIX)
5482 suffix_check.no_ssuf = 1;
5483 else if (i.suffix == LONG_MNEM_SUFFIX)
5484 suffix_check.no_lsuf = 1;
5485 else if (i.suffix == QWORD_MNEM_SUFFIX)
5486 suffix_check.no_qsuf = 1;
5487 else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
5488 suffix_check.no_ldsuf = 1;
5489
5490 memset (&mnemsuf_check, 0, sizeof (mnemsuf_check));
5491 if (intel_syntax)
5492 {
5493 switch (mnem_suffix)
5494 {
5495 case BYTE_MNEM_SUFFIX: mnemsuf_check.no_bsuf = 1; break;
5496 case WORD_MNEM_SUFFIX: mnemsuf_check.no_wsuf = 1; break;
5497 case SHORT_MNEM_SUFFIX: mnemsuf_check.no_ssuf = 1; break;
5498 case LONG_MNEM_SUFFIX: mnemsuf_check.no_lsuf = 1; break;
5499 case QWORD_MNEM_SUFFIX: mnemsuf_check.no_qsuf = 1; break;
5500 }
5501 }
5502
5503 /* Must have right number of operands. */
5504 i.error = number_of_operands_mismatch;
5505
5506 for (t = current_templates->start; t < current_templates->end; t++)
5507 {
5508 addr_prefix_disp = -1;
5509
5510 if (i.operands != t->operands)
5511 continue;
5512
5513 /* Check processor support. */
5514 i.error = unsupported;
5515 found_cpu_match = (cpu_flags_match (t)
5516 == CPU_FLAGS_PERFECT_MATCH);
5517 if (!found_cpu_match)
5518 continue;
5519
5520 /* Check AT&T mnemonic. */
5521 i.error = unsupported_with_intel_mnemonic;
5522 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
5523 continue;
5524
5525 /* Check AT&T/Intel syntax and Intel64/AMD64 ISA. */
5526 i.error = unsupported_syntax;
5527 if ((intel_syntax && t->opcode_modifier.attsyntax)
5528 || (!intel_syntax && t->opcode_modifier.intelsyntax)
5529 || (intel64 && t->opcode_modifier.amd64)
5530 || (!intel64 && t->opcode_modifier.intel64))
5531 continue;
5532
5533 /* Check the suffix, except for some instructions in intel mode. */
5534 i.error = invalid_instruction_suffix;
5535 if ((!intel_syntax || !t->opcode_modifier.ignoresize)
5536 && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
5537 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
5538 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
5539 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
5540 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
5541 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
5542 continue;
5543 /* In Intel mode all mnemonic suffixes must be explicitly allowed. */
5544 if ((t->opcode_modifier.no_bsuf && mnemsuf_check.no_bsuf)
5545 || (t->opcode_modifier.no_wsuf && mnemsuf_check.no_wsuf)
5546 || (t->opcode_modifier.no_lsuf && mnemsuf_check.no_lsuf)
5547 || (t->opcode_modifier.no_ssuf && mnemsuf_check.no_ssuf)
5548 || (t->opcode_modifier.no_qsuf && mnemsuf_check.no_qsuf)
5549 || (t->opcode_modifier.no_ldsuf && mnemsuf_check.no_ldsuf))
5550 continue;
5551
5552 size_match = operand_size_match (t);
5553 if (!size_match)
5554 continue;
5555
5556 for (j = 0; j < MAX_OPERANDS; j++)
5557 operand_types[j] = t->operand_types[j];
5558
5559 /* In general, don't allow 64-bit operands in 32-bit mode. */
5560 if (i.suffix == QWORD_MNEM_SUFFIX
5561 && flag_code != CODE_64BIT
5562 && (intel_syntax
5563 ? (!t->opcode_modifier.ignoresize
5564 && !t->opcode_modifier.broadcast
5565 && !intel_float_operand (t->name))
5566 : intel_float_operand (t->name) != 2)
5567 && ((!operand_types[0].bitfield.regmmx
5568 && !operand_types[0].bitfield.regsimd)
5569 || (!operand_types[t->operands > 1].bitfield.regmmx
5570 && !operand_types[t->operands > 1].bitfield.regsimd))
5571 && (t->base_opcode != 0x0fc7
5572 || t->extension_opcode != 1 /* cmpxchg8b */))
5573 continue;
5574
5575 /* In general, don't allow 32-bit operands on pre-386. */
5576 else if (i.suffix == LONG_MNEM_SUFFIX
5577 && !cpu_arch_flags.bitfield.cpui386
5578 && (intel_syntax
5579 ? (!t->opcode_modifier.ignoresize
5580 && !intel_float_operand (t->name))
5581 : intel_float_operand (t->name) != 2)
5582 && ((!operand_types[0].bitfield.regmmx
5583 && !operand_types[0].bitfield.regsimd)
5584 || (!operand_types[t->operands > 1].bitfield.regmmx
5585 && !operand_types[t->operands > 1].bitfield.regsimd)))
5586 continue;
5587
5588 /* Do not verify operands when there are none. */
5589 else
5590 {
5591 if (!t->operands)
5592 /* We've found a match; break out of loop. */
5593 break;
5594 }
5595
5596 /* Address size prefix will turn Disp64/Disp32/Disp16 operand
5597 into Disp32/Disp16/Disp32 operand. */
5598 if (i.prefix[ADDR_PREFIX] != 0)
5599 {
5600 /* There should be only one Disp operand. */
5601 switch (flag_code)
5602 {
5603 case CODE_16BIT:
5604 for (j = 0; j < MAX_OPERANDS; j++)
5605 {
5606 if (operand_types[j].bitfield.disp16)
5607 {
5608 addr_prefix_disp = j;
5609 operand_types[j].bitfield.disp32 = 1;
5610 operand_types[j].bitfield.disp16 = 0;
5611 break;
5612 }
5613 }
5614 break;
5615 case CODE_32BIT:
5616 for (j = 0; j < MAX_OPERANDS; j++)
5617 {
5618 if (operand_types[j].bitfield.disp32)
5619 {
5620 addr_prefix_disp = j;
5621 operand_types[j].bitfield.disp32 = 0;
5622 operand_types[j].bitfield.disp16 = 1;
5623 break;
5624 }
5625 }
5626 break;
5627 case CODE_64BIT:
5628 for (j = 0; j < MAX_OPERANDS; j++)
5629 {
5630 if (operand_types[j].bitfield.disp64)
5631 {
5632 addr_prefix_disp = j;
5633 operand_types[j].bitfield.disp64 = 0;
5634 operand_types[j].bitfield.disp32 = 1;
5635 break;
5636 }
5637 }
5638 break;
5639 }
5640 }
5641
5642 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
5643 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
5644 continue;
5645
5646 /* We check register size if needed. */
5647 if (t->opcode_modifier.checkregsize)
5648 {
5649 check_register = (1 << t->operands) - 1;
5650 if (i.broadcast)
5651 check_register &= ~(1 << i.broadcast->operand);
5652 }
5653 else
5654 check_register = 0;
5655
5656 overlap0 = operand_type_and (i.types[0], operand_types[0]);
5657 switch (t->operands)
5658 {
5659 case 1:
5660 if (!operand_type_match (overlap0, i.types[0]))
5661 continue;
5662 break;
5663 case 2:
5664 /* xchg %eax, %eax is a special case. It is an alias for nop
5665 only in 32bit mode and we can use opcode 0x90. In 64bit
5666 mode, we can't use 0x90 for xchg %eax, %eax since it should
5667 zero-extend %eax to %rax. */
5668 if (flag_code == CODE_64BIT
5669 && t->base_opcode == 0x90
5670 && operand_type_equal (&i.types [0], &acc32)
5671 && operand_type_equal (&i.types [1], &acc32))
5672 continue;
5673 /* xrelease mov %eax, <disp> is another special case. It must not
5674 match the accumulator-only encoding of mov. */
5675 if (flag_code != CODE_64BIT
5676 && i.hle_prefix
5677 && t->base_opcode == 0xa0
5678 && i.types[0].bitfield.acc
5679 && operand_type_check (i.types[1], anymem))
5680 continue;
5681 if (!(size_match & MATCH_STRAIGHT))
5682 goto check_reverse;
5683 /* If we want store form, we reverse direction of operands. */
5684 if (i.dir_encoding == dir_encoding_store
5685 && t->opcode_modifier.d)
5686 goto check_reverse;
5687 /* Fall through. */
5688
5689 case 3:
5690 /* If we want store form, we skip the current load. */
5691 if (i.dir_encoding == dir_encoding_store
5692 && i.mem_operands == 0
5693 && t->opcode_modifier.load)
5694 continue;
5695 /* Fall through. */
5696 case 4:
5697 case 5:
5698 overlap1 = operand_type_and (i.types[1], operand_types[1]);
5699 if (!operand_type_match (overlap0, i.types[0])
5700 || !operand_type_match (overlap1, i.types[1])
5701 || ((check_register & 3) == 3
5702 && !operand_type_register_match (i.types[0],
5703 operand_types[0],
5704 i.types[1],
5705 operand_types[1])))
5706 {
5707 /* Check if other direction is valid ... */
5708 if (!t->opcode_modifier.d)
5709 continue;
5710
5711 check_reverse:
5712 if (!(size_match & MATCH_REVERSE))
5713 continue;
5714 /* Try reversing direction of operands. */
5715 overlap0 = operand_type_and (i.types[0], operand_types[1]);
5716 overlap1 = operand_type_and (i.types[1], operand_types[0]);
5717 if (!operand_type_match (overlap0, i.types[0])
5718 || !operand_type_match (overlap1, i.types[1])
5719 || (check_register
5720 && !operand_type_register_match (i.types[0],
5721 operand_types[1],
5722 i.types[1],
5723 operand_types[0])))
5724 {
5725 /* Does not match either direction. */
5726 continue;
5727 }
5728 /* found_reverse_match holds which of D or FloatR
5729 we've found. */
5730 if (!t->opcode_modifier.d)
5731 found_reverse_match = 0;
5732 else if (operand_types[0].bitfield.tbyte)
5733 found_reverse_match = Opcode_FloatD;
5734 else
5735 found_reverse_match = Opcode_D;
5736 if (t->opcode_modifier.floatr)
5737 found_reverse_match |= Opcode_FloatR;
5738 }
5739 else
5740 {
5741 /* Found a forward 2 operand match here. */
5742 switch (t->operands)
5743 {
5744 case 5:
5745 overlap4 = operand_type_and (i.types[4],
5746 operand_types[4]);
5747 /* Fall through. */
5748 case 4:
5749 overlap3 = operand_type_and (i.types[3],
5750 operand_types[3]);
5751 /* Fall through. */
5752 case 3:
5753 overlap2 = operand_type_and (i.types[2],
5754 operand_types[2]);
5755 break;
5756 }
5757
5758 switch (t->operands)
5759 {
5760 case 5:
5761 if (!operand_type_match (overlap4, i.types[4])
5762 || !operand_type_register_match (i.types[3],
5763 operand_types[3],
5764 i.types[4],
5765 operand_types[4]))
5766 continue;
5767 /* Fall through. */
5768 case 4:
5769 if (!operand_type_match (overlap3, i.types[3])
5770 || ((check_register & 0xa) == 0xa
5771 && !operand_type_register_match (i.types[1],
5772 operand_types[1],
5773 i.types[3],
5774 operand_types[3]))
5775 || ((check_register & 0xc) == 0xc
5776 && !operand_type_register_match (i.types[2],
5777 operand_types[2],
5778 i.types[3],
5779 operand_types[3])))
5780 continue;
5781 /* Fall through. */
5782 case 3:
5783 /* Here we make use of the fact that there are no
5784 reverse match 3 operand instructions. */
5785 if (!operand_type_match (overlap2, i.types[2])
5786 || ((check_register & 5) == 5
5787 && !operand_type_register_match (i.types[0],
5788 operand_types[0],
5789 i.types[2],
5790 operand_types[2]))
5791 || ((check_register & 6) == 6
5792 && !operand_type_register_match (i.types[1],
5793 operand_types[1],
5794 i.types[2],
5795 operand_types[2])))
5796 continue;
5797 break;
5798 }
5799 }
5800 /* Found either forward/reverse 2, 3 or 4 operand match here:
5801 slip through to break. */
5802 }
5803 if (!found_cpu_match)
5804 {
5805 found_reverse_match = 0;
5806 continue;
5807 }
5808
5809 /* Check if vector and VEX operands are valid. */
5810 if (check_VecOperands (t) || VEX_check_operands (t))
5811 {
5812 specific_error = i.error;
5813 continue;
5814 }
5815
5816 /* We've found a match; break out of loop. */
5817 break;
5818 }
5819
5820 if (t == current_templates->end)
5821 {
5822 /* We found no match. */
5823 const char *err_msg;
5824 switch (specific_error ? specific_error : i.error)
5825 {
5826 default:
5827 abort ();
5828 case operand_size_mismatch:
5829 err_msg = _("operand size mismatch");
5830 break;
5831 case operand_type_mismatch:
5832 err_msg = _("operand type mismatch");
5833 break;
5834 case register_type_mismatch:
5835 err_msg = _("register type mismatch");
5836 break;
5837 case number_of_operands_mismatch:
5838 err_msg = _("number of operands mismatch");
5839 break;
5840 case invalid_instruction_suffix:
5841 err_msg = _("invalid instruction suffix");
5842 break;
5843 case bad_imm4:
5844 err_msg = _("constant doesn't fit in 4 bits");
5845 break;
5846 case unsupported_with_intel_mnemonic:
5847 err_msg = _("unsupported with Intel mnemonic");
5848 break;
5849 case unsupported_syntax:
5850 err_msg = _("unsupported syntax");
5851 break;
5852 case unsupported:
5853 as_bad (_("unsupported instruction `%s'"),
5854 current_templates->start->name);
5855 return NULL;
5856 case invalid_vsib_address:
5857 err_msg = _("invalid VSIB address");
5858 break;
5859 case invalid_vector_register_set:
5860 err_msg = _("mask, index, and destination registers must be distinct");
5861 break;
5862 case unsupported_vector_index_register:
5863 err_msg = _("unsupported vector index register");
5864 break;
5865 case unsupported_broadcast:
5866 err_msg = _("unsupported broadcast");
5867 break;
5868 case broadcast_needed:
5869 err_msg = _("broadcast is needed for operand of such type");
5870 break;
5871 case unsupported_masking:
5872 err_msg = _("unsupported masking");
5873 break;
5874 case mask_not_on_destination:
5875 err_msg = _("mask not on destination operand");
5876 break;
5877 case no_default_mask:
5878 err_msg = _("default mask isn't allowed");
5879 break;
5880 case unsupported_rc_sae:
5881 err_msg = _("unsupported static rounding/sae");
5882 break;
5883 case rc_sae_operand_not_last_imm:
5884 if (intel_syntax)
5885 err_msg = _("RC/SAE operand must precede immediate operands");
5886 else
5887 err_msg = _("RC/SAE operand must follow immediate operands");
5888 break;
5889 case invalid_register_operand:
5890 err_msg = _("invalid register operand");
5891 break;
5892 }
5893 as_bad (_("%s for `%s'"), err_msg,
5894 current_templates->start->name);
5895 return NULL;
5896 }
5897
5898 if (!quiet_warnings)
5899 {
5900 if (!intel_syntax
5901 && (i.types[0].bitfield.jumpabsolute
5902 != operand_types[0].bitfield.jumpabsolute))
5903 {
5904 as_warn (_("indirect %s without `*'"), t->name);
5905 }
5906
5907 if (t->opcode_modifier.isprefix
5908 && t->opcode_modifier.ignoresize)
5909 {
5910 /* Warn them that a data or address size prefix doesn't
5911 affect assembly of the next line of code. */
5912 as_warn (_("stand-alone `%s' prefix"), t->name);
5913 }
5914 }
5915
5916 /* Copy the template we found. */
5917 i.tm = *t;
5918
5919 if (addr_prefix_disp != -1)
5920 i.tm.operand_types[addr_prefix_disp]
5921 = operand_types[addr_prefix_disp];
5922
5923 if (found_reverse_match)
5924 {
5925 /* If we found a reverse match we must alter the opcode
5926 direction bit. found_reverse_match holds bits to change
5927 (different for int & float insns). */
5928
5929 i.tm.base_opcode ^= found_reverse_match;
5930
5931 i.tm.operand_types[0] = operand_types[1];
5932 i.tm.operand_types[1] = operand_types[0];
5933 }
5934
5935 return t;
5936 }
5937
5938 static int
5939 check_string (void)
5940 {
5941 int mem_op = operand_type_check (i.types[0], anymem) ? 0 : 1;
5942 if (i.tm.operand_types[mem_op].bitfield.esseg)
5943 {
5944 if (i.seg[0] != NULL && i.seg[0] != &es)
5945 {
5946 as_bad (_("`%s' operand %d must use `%ses' segment"),
5947 i.tm.name,
5948 mem_op + 1,
5949 register_prefix);
5950 return 0;
5951 }
5952 /* There's only ever one segment override allowed per instruction.
5953 This instruction possibly has a legal segment override on the
5954 second operand, so copy the segment to where non-string
5955 instructions store it, allowing common code. */
5956 i.seg[0] = i.seg[1];
5957 }
5958 else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
5959 {
5960 if (i.seg[1] != NULL && i.seg[1] != &es)
5961 {
5962 as_bad (_("`%s' operand %d must use `%ses' segment"),
5963 i.tm.name,
5964 mem_op + 2,
5965 register_prefix);
5966 return 0;
5967 }
5968 }
5969 return 1;
5970 }
5971
5972 static int
5973 process_suffix (void)
5974 {
5975 /* If matched instruction specifies an explicit instruction mnemonic
5976 suffix, use it. */
5977 if (i.tm.opcode_modifier.size16)
5978 i.suffix = WORD_MNEM_SUFFIX;
5979 else if (i.tm.opcode_modifier.size32)
5980 i.suffix = LONG_MNEM_SUFFIX;
5981 else if (i.tm.opcode_modifier.size64)
5982 i.suffix = QWORD_MNEM_SUFFIX;
5983 else if (i.reg_operands)
5984 {
5985 /* If there's no instruction mnemonic suffix we try to invent one
5986 based on register operands. */
5987 if (!i.suffix)
5988 {
5989 /* We take i.suffix from the last register operand specified,
5990 Destination register type is more significant than source
5991 register type. crc32 in SSE4.2 prefers source register
5992 type. */
5993 if (i.tm.base_opcode == 0xf20f38f1)
5994 {
5995 if (i.types[0].bitfield.reg && i.types[0].bitfield.word)
5996 i.suffix = WORD_MNEM_SUFFIX;
5997 else if (i.types[0].bitfield.reg && i.types[0].bitfield.dword)
5998 i.suffix = LONG_MNEM_SUFFIX;
5999 else if (i.types[0].bitfield.reg && i.types[0].bitfield.qword)
6000 i.suffix = QWORD_MNEM_SUFFIX;
6001 }
6002 else if (i.tm.base_opcode == 0xf20f38f0)
6003 {
6004 if (i.types[0].bitfield.reg && i.types[0].bitfield.byte)
6005 i.suffix = BYTE_MNEM_SUFFIX;
6006 }
6007
6008 if (!i.suffix)
6009 {
6010 int op;
6011
6012 if (i.tm.base_opcode == 0xf20f38f1
6013 || i.tm.base_opcode == 0xf20f38f0)
6014 {
6015 /* We have to know the operand size for crc32. */
6016 as_bad (_("ambiguous memory operand size for `%s`"),
6017 i.tm.name);
6018 return 0;
6019 }
6020
6021 for (op = i.operands; --op >= 0;)
6022 if (!i.tm.operand_types[op].bitfield.inoutportreg
6023 && !i.tm.operand_types[op].bitfield.shiftcount)
6024 {
6025 if (!i.types[op].bitfield.reg)
6026 continue;
6027 if (i.types[op].bitfield.byte)
6028 i.suffix = BYTE_MNEM_SUFFIX;
6029 else if (i.types[op].bitfield.word)
6030 i.suffix = WORD_MNEM_SUFFIX;
6031 else if (i.types[op].bitfield.dword)
6032 i.suffix = LONG_MNEM_SUFFIX;
6033 else if (i.types[op].bitfield.qword)
6034 i.suffix = QWORD_MNEM_SUFFIX;
6035 else
6036 continue;
6037 break;
6038 }
6039 }
6040 }
6041 else if (i.suffix == BYTE_MNEM_SUFFIX)
6042 {
6043 if (intel_syntax
6044 && i.tm.opcode_modifier.ignoresize
6045 && i.tm.opcode_modifier.no_bsuf)
6046 i.suffix = 0;
6047 else if (!check_byte_reg ())
6048 return 0;
6049 }
6050 else if (i.suffix == LONG_MNEM_SUFFIX)
6051 {
6052 if (intel_syntax
6053 && i.tm.opcode_modifier.ignoresize
6054 && i.tm.opcode_modifier.no_lsuf
6055 && !i.tm.opcode_modifier.todword
6056 && !i.tm.opcode_modifier.toqword)
6057 i.suffix = 0;
6058 else if (!check_long_reg ())
6059 return 0;
6060 }
6061 else if (i.suffix == QWORD_MNEM_SUFFIX)
6062 {
6063 if (intel_syntax
6064 && i.tm.opcode_modifier.ignoresize
6065 && i.tm.opcode_modifier.no_qsuf
6066 && !i.tm.opcode_modifier.todword
6067 && !i.tm.opcode_modifier.toqword)
6068 i.suffix = 0;
6069 else if (!check_qword_reg ())
6070 return 0;
6071 }
6072 else if (i.suffix == WORD_MNEM_SUFFIX)
6073 {
6074 if (intel_syntax
6075 && i.tm.opcode_modifier.ignoresize
6076 && i.tm.opcode_modifier.no_wsuf)
6077 i.suffix = 0;
6078 else if (!check_word_reg ())
6079 return 0;
6080 }
6081 else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
6082 /* Do nothing if the instruction is going to ignore the prefix. */
6083 ;
6084 else
6085 abort ();
6086 }
6087 else if (i.tm.opcode_modifier.defaultsize
6088 && !i.suffix
6089 /* exclude fldenv/frstor/fsave/fstenv */
6090 && i.tm.opcode_modifier.no_ssuf)
6091 {
6092 i.suffix = stackop_size;
6093 }
6094 else if (intel_syntax
6095 && !i.suffix
6096 && (i.tm.operand_types[0].bitfield.jumpabsolute
6097 || i.tm.opcode_modifier.jumpbyte
6098 || i.tm.opcode_modifier.jumpintersegment
6099 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6100 && i.tm.extension_opcode <= 3)))
6101 {
6102 switch (flag_code)
6103 {
6104 case CODE_64BIT:
6105 if (!i.tm.opcode_modifier.no_qsuf)
6106 {
6107 i.suffix = QWORD_MNEM_SUFFIX;
6108 break;
6109 }
6110 /* Fall through. */
6111 case CODE_32BIT:
6112 if (!i.tm.opcode_modifier.no_lsuf)
6113 i.suffix = LONG_MNEM_SUFFIX;
6114 break;
6115 case CODE_16BIT:
6116 if (!i.tm.opcode_modifier.no_wsuf)
6117 i.suffix = WORD_MNEM_SUFFIX;
6118 break;
6119 }
6120 }
6121
6122 if (!i.suffix)
6123 {
6124 if (!intel_syntax)
6125 {
6126 if (i.tm.opcode_modifier.w)
6127 {
6128 as_bad (_("no instruction mnemonic suffix given and "
6129 "no register operands; can't size instruction"));
6130 return 0;
6131 }
6132 }
6133 else
6134 {
6135 unsigned int suffixes;
6136
6137 suffixes = !i.tm.opcode_modifier.no_bsuf;
6138 if (!i.tm.opcode_modifier.no_wsuf)
6139 suffixes |= 1 << 1;
6140 if (!i.tm.opcode_modifier.no_lsuf)
6141 suffixes |= 1 << 2;
6142 if (!i.tm.opcode_modifier.no_ldsuf)
6143 suffixes |= 1 << 3;
6144 if (!i.tm.opcode_modifier.no_ssuf)
6145 suffixes |= 1 << 4;
6146 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6147 suffixes |= 1 << 5;
6148
6149 /* There are more than suffix matches. */
6150 if (i.tm.opcode_modifier.w
6151 || ((suffixes & (suffixes - 1))
6152 && !i.tm.opcode_modifier.defaultsize
6153 && !i.tm.opcode_modifier.ignoresize))
6154 {
6155 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6156 return 0;
6157 }
6158 }
6159 }
6160
6161 /* Change the opcode based on the operand size given by i.suffix. */
6162 switch (i.suffix)
6163 {
6164 /* Size floating point instruction. */
6165 case LONG_MNEM_SUFFIX:
6166 if (i.tm.opcode_modifier.floatmf)
6167 {
6168 i.tm.base_opcode ^= 4;
6169 break;
6170 }
6171 /* fall through */
6172 case WORD_MNEM_SUFFIX:
6173 case QWORD_MNEM_SUFFIX:
6174 /* It's not a byte, select word/dword operation. */
6175 if (i.tm.opcode_modifier.w)
6176 {
6177 if (i.tm.opcode_modifier.shortform)
6178 i.tm.base_opcode |= 8;
6179 else
6180 i.tm.base_opcode |= 1;
6181 }
6182 /* fall through */
6183 case SHORT_MNEM_SUFFIX:
6184 /* Now select between word & dword operations via the operand
6185 size prefix, except for instructions that will ignore this
6186 prefix anyway. */
6187 if (i.reg_operands > 0
6188 && i.types[0].bitfield.reg
6189 && i.tm.opcode_modifier.addrprefixopreg
6190 && (i.tm.opcode_modifier.immext
6191 || i.operands == 1))
6192 {
6193 /* The address size override prefix changes the size of the
6194 first operand. */
6195 if ((flag_code == CODE_32BIT
6196 && i.op[0].regs->reg_type.bitfield.word)
6197 || (flag_code != CODE_32BIT
6198 && i.op[0].regs->reg_type.bitfield.dword))
6199 if (!add_prefix (ADDR_PREFIX_OPCODE))
6200 return 0;
6201 }
6202 else if (i.suffix != QWORD_MNEM_SUFFIX
6203 && !i.tm.opcode_modifier.ignoresize
6204 && !i.tm.opcode_modifier.floatmf
6205 && !i.tm.opcode_modifier.vex
6206 && !i.tm.opcode_modifier.vexopcode
6207 && !is_evex_encoding (&i.tm)
6208 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
6209 || (flag_code == CODE_64BIT
6210 && i.tm.opcode_modifier.jumpbyte)))
6211 {
6212 unsigned int prefix = DATA_PREFIX_OPCODE;
6213
6214 if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
6215 prefix = ADDR_PREFIX_OPCODE;
6216
6217 if (!add_prefix (prefix))
6218 return 0;
6219 }
6220
6221 /* Set mode64 for an operand. */
6222 if (i.suffix == QWORD_MNEM_SUFFIX
6223 && flag_code == CODE_64BIT
6224 && !i.tm.opcode_modifier.norex64
6225 /* Special case for xchg %rax,%rax. It is NOP and doesn't
6226 need rex64. */
6227 && ! (i.operands == 2
6228 && i.tm.base_opcode == 0x90
6229 && i.tm.extension_opcode == None
6230 && operand_type_equal (&i.types [0], &acc64)
6231 && operand_type_equal (&i.types [1], &acc64)))
6232 i.rex |= REX_W;
6233
6234 break;
6235 }
6236
6237 if (i.reg_operands != 0
6238 && i.operands > 1
6239 && i.tm.opcode_modifier.addrprefixopreg
6240 && !i.tm.opcode_modifier.immext)
6241 {
6242 /* Check invalid register operand when the address size override
6243 prefix changes the size of register operands. */
6244 unsigned int op;
6245 enum { need_word, need_dword, need_qword } need;
6246
6247 if (flag_code == CODE_32BIT)
6248 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
6249 else
6250 {
6251 if (i.prefix[ADDR_PREFIX])
6252 need = need_dword;
6253 else
6254 need = flag_code == CODE_64BIT ? need_qword : need_word;
6255 }
6256
6257 for (op = 0; op < i.operands; op++)
6258 if (i.types[op].bitfield.reg
6259 && ((need == need_word
6260 && !i.op[op].regs->reg_type.bitfield.word)
6261 || (need == need_dword
6262 && !i.op[op].regs->reg_type.bitfield.dword)
6263 || (need == need_qword
6264 && !i.op[op].regs->reg_type.bitfield.qword)))
6265 {
6266 as_bad (_("invalid register operand size for `%s'"),
6267 i.tm.name);
6268 return 0;
6269 }
6270 }
6271
6272 return 1;
6273 }
6274
6275 static int
6276 check_byte_reg (void)
6277 {
6278 int op;
6279
6280 for (op = i.operands; --op >= 0;)
6281 {
6282 /* Skip non-register operands. */
6283 if (!i.types[op].bitfield.reg)
6284 continue;
6285
6286 /* If this is an eight bit register, it's OK. If it's the 16 or
6287 32 bit version of an eight bit register, we will just use the
6288 low portion, and that's OK too. */
6289 if (i.types[op].bitfield.byte)
6290 continue;
6291
6292 /* I/O port address operands are OK too. */
6293 if (i.tm.operand_types[op].bitfield.inoutportreg)
6294 continue;
6295
6296 /* crc32 doesn't generate this warning. */
6297 if (i.tm.base_opcode == 0xf20f38f0)
6298 continue;
6299
6300 if ((i.types[op].bitfield.word
6301 || i.types[op].bitfield.dword
6302 || i.types[op].bitfield.qword)
6303 && i.op[op].regs->reg_num < 4
6304 /* Prohibit these changes in 64bit mode, since the lowering
6305 would be more complicated. */
6306 && flag_code != CODE_64BIT)
6307 {
6308 #if REGISTER_WARNINGS
6309 if (!quiet_warnings)
6310 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6311 register_prefix,
6312 (i.op[op].regs + (i.types[op].bitfield.word
6313 ? REGNAM_AL - REGNAM_AX
6314 : REGNAM_AL - REGNAM_EAX))->reg_name,
6315 register_prefix,
6316 i.op[op].regs->reg_name,
6317 i.suffix);
6318 #endif
6319 continue;
6320 }
6321 /* Any other register is bad. */
6322 if (i.types[op].bitfield.reg
6323 || i.types[op].bitfield.regmmx
6324 || i.types[op].bitfield.regsimd
6325 || i.types[op].bitfield.sreg2
6326 || i.types[op].bitfield.sreg3
6327 || i.types[op].bitfield.control
6328 || i.types[op].bitfield.debug
6329 || i.types[op].bitfield.test)
6330 {
6331 as_bad (_("`%s%s' not allowed with `%s%c'"),
6332 register_prefix,
6333 i.op[op].regs->reg_name,
6334 i.tm.name,
6335 i.suffix);
6336 return 0;
6337 }
6338 }
6339 return 1;
6340 }
6341
6342 static int
6343 check_long_reg (void)
6344 {
6345 int op;
6346
6347 for (op = i.operands; --op >= 0;)
6348 /* Skip non-register operands. */
6349 if (!i.types[op].bitfield.reg)
6350 continue;
6351 /* Reject eight bit registers, except where the template requires
6352 them. (eg. movzb) */
6353 else if (i.types[op].bitfield.byte
6354 && (i.tm.operand_types[op].bitfield.reg
6355 || i.tm.operand_types[op].bitfield.acc)
6356 && (i.tm.operand_types[op].bitfield.word
6357 || i.tm.operand_types[op].bitfield.dword))
6358 {
6359 as_bad (_("`%s%s' not allowed with `%s%c'"),
6360 register_prefix,
6361 i.op[op].regs->reg_name,
6362 i.tm.name,
6363 i.suffix);
6364 return 0;
6365 }
6366 /* Warn if the e prefix on a general reg is missing. */
6367 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6368 && i.types[op].bitfield.word
6369 && (i.tm.operand_types[op].bitfield.reg
6370 || i.tm.operand_types[op].bitfield.acc)
6371 && i.tm.operand_types[op].bitfield.dword)
6372 {
6373 /* Prohibit these changes in the 64bit mode, since the
6374 lowering is more complicated. */
6375 if (flag_code == CODE_64BIT)
6376 {
6377 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6378 register_prefix, i.op[op].regs->reg_name,
6379 i.suffix);
6380 return 0;
6381 }
6382 #if REGISTER_WARNINGS
6383 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6384 register_prefix,
6385 (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
6386 register_prefix, i.op[op].regs->reg_name, i.suffix);
6387 #endif
6388 }
6389 /* Warn if the r prefix on a general reg is present. */
6390 else if (i.types[op].bitfield.qword
6391 && (i.tm.operand_types[op].bitfield.reg
6392 || i.tm.operand_types[op].bitfield.acc)
6393 && i.tm.operand_types[op].bitfield.dword)
6394 {
6395 if (intel_syntax
6396 && i.tm.opcode_modifier.toqword
6397 && !i.types[0].bitfield.regsimd)
6398 {
6399 /* Convert to QWORD. We want REX byte. */
6400 i.suffix = QWORD_MNEM_SUFFIX;
6401 }
6402 else
6403 {
6404 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6405 register_prefix, i.op[op].regs->reg_name,
6406 i.suffix);
6407 return 0;
6408 }
6409 }
6410 return 1;
6411 }
6412
6413 static int
6414 check_qword_reg (void)
6415 {
6416 int op;
6417
6418 for (op = i.operands; --op >= 0; )
6419 /* Skip non-register operands. */
6420 if (!i.types[op].bitfield.reg)
6421 continue;
6422 /* Reject eight bit registers, except where the template requires
6423 them. (eg. movzb) */
6424 else if (i.types[op].bitfield.byte
6425 && (i.tm.operand_types[op].bitfield.reg
6426 || i.tm.operand_types[op].bitfield.acc)
6427 && (i.tm.operand_types[op].bitfield.word
6428 || i.tm.operand_types[op].bitfield.dword))
6429 {
6430 as_bad (_("`%s%s' not allowed with `%s%c'"),
6431 register_prefix,
6432 i.op[op].regs->reg_name,
6433 i.tm.name,
6434 i.suffix);
6435 return 0;
6436 }
6437 /* Warn if the r prefix on a general reg is missing. */
6438 else if ((i.types[op].bitfield.word
6439 || i.types[op].bitfield.dword)
6440 && (i.tm.operand_types[op].bitfield.reg
6441 || i.tm.operand_types[op].bitfield.acc)
6442 && i.tm.operand_types[op].bitfield.qword)
6443 {
6444 /* Prohibit these changes in the 64bit mode, since the
6445 lowering is more complicated. */
6446 if (intel_syntax
6447 && i.tm.opcode_modifier.todword
6448 && !i.types[0].bitfield.regsimd)
6449 {
6450 /* Convert to DWORD. We don't want REX byte. */
6451 i.suffix = LONG_MNEM_SUFFIX;
6452 }
6453 else
6454 {
6455 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6456 register_prefix, i.op[op].regs->reg_name,
6457 i.suffix);
6458 return 0;
6459 }
6460 }
6461 return 1;
6462 }
6463
6464 static int
6465 check_word_reg (void)
6466 {
6467 int op;
6468 for (op = i.operands; --op >= 0;)
6469 /* Skip non-register operands. */
6470 if (!i.types[op].bitfield.reg)
6471 continue;
6472 /* Reject eight bit registers, except where the template requires
6473 them. (eg. movzb) */
6474 else if (i.types[op].bitfield.byte
6475 && (i.tm.operand_types[op].bitfield.reg
6476 || i.tm.operand_types[op].bitfield.acc)
6477 && (i.tm.operand_types[op].bitfield.word
6478 || i.tm.operand_types[op].bitfield.dword))
6479 {
6480 as_bad (_("`%s%s' not allowed with `%s%c'"),
6481 register_prefix,
6482 i.op[op].regs->reg_name,
6483 i.tm.name,
6484 i.suffix);
6485 return 0;
6486 }
6487 /* Warn if the e or r prefix on a general reg is present. */
6488 else if ((!quiet_warnings || flag_code == CODE_64BIT)
6489 && (i.types[op].bitfield.dword
6490 || i.types[op].bitfield.qword)
6491 && (i.tm.operand_types[op].bitfield.reg
6492 || i.tm.operand_types[op].bitfield.acc)
6493 && i.tm.operand_types[op].bitfield.word)
6494 {
6495 /* Prohibit these changes in the 64bit mode, since the
6496 lowering is more complicated. */
6497 if (flag_code == CODE_64BIT)
6498 {
6499 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
6500 register_prefix, i.op[op].regs->reg_name,
6501 i.suffix);
6502 return 0;
6503 }
6504 #if REGISTER_WARNINGS
6505 as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
6506 register_prefix,
6507 (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
6508 register_prefix, i.op[op].regs->reg_name, i.suffix);
6509 #endif
6510 }
6511 return 1;
6512 }
6513
6514 static int
6515 update_imm (unsigned int j)
6516 {
6517 i386_operand_type overlap = i.types[j];
6518 if ((overlap.bitfield.imm8
6519 || overlap.bitfield.imm8s
6520 || overlap.bitfield.imm16
6521 || overlap.bitfield.imm32
6522 || overlap.bitfield.imm32s
6523 || overlap.bitfield.imm64)
6524 && !operand_type_equal (&overlap, &imm8)
6525 && !operand_type_equal (&overlap, &imm8s)
6526 && !operand_type_equal (&overlap, &imm16)
6527 && !operand_type_equal (&overlap, &imm32)
6528 && !operand_type_equal (&overlap, &imm32s)
6529 && !operand_type_equal (&overlap, &imm64))
6530 {
6531 if (i.suffix)
6532 {
6533 i386_operand_type temp;
6534
6535 operand_type_set (&temp, 0);
6536 if (i.suffix == BYTE_MNEM_SUFFIX)
6537 {
6538 temp.bitfield.imm8 = overlap.bitfield.imm8;
6539 temp.bitfield.imm8s = overlap.bitfield.imm8s;
6540 }
6541 else if (i.suffix == WORD_MNEM_SUFFIX)
6542 temp.bitfield.imm16 = overlap.bitfield.imm16;
6543 else if (i.suffix == QWORD_MNEM_SUFFIX)
6544 {
6545 temp.bitfield.imm64 = overlap.bitfield.imm64;
6546 temp.bitfield.imm32s = overlap.bitfield.imm32s;
6547 }
6548 else
6549 temp.bitfield.imm32 = overlap.bitfield.imm32;
6550 overlap = temp;
6551 }
6552 else if (operand_type_equal (&overlap, &imm16_32_32s)
6553 || operand_type_equal (&overlap, &imm16_32)
6554 || operand_type_equal (&overlap, &imm16_32s))
6555 {
6556 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
6557 overlap = imm16;
6558 else
6559 overlap = imm32s;
6560 }
6561 if (!operand_type_equal (&overlap, &imm8)
6562 && !operand_type_equal (&overlap, &imm8s)
6563 && !operand_type_equal (&overlap, &imm16)
6564 && !operand_type_equal (&overlap, &imm32)
6565 && !operand_type_equal (&overlap, &imm32s)
6566 && !operand_type_equal (&overlap, &imm64))
6567 {
6568 as_bad (_("no instruction mnemonic suffix given; "
6569 "can't determine immediate size"));
6570 return 0;
6571 }
6572 }
6573 i.types[j] = overlap;
6574
6575 return 1;
6576 }
6577
6578 static int
6579 finalize_imm (void)
6580 {
6581 unsigned int j, n;
6582
6583 /* Update the first 2 immediate operands. */
6584 n = i.operands > 2 ? 2 : i.operands;
6585 if (n)
6586 {
6587 for (j = 0; j < n; j++)
6588 if (update_imm (j) == 0)
6589 return 0;
6590
6591 /* The 3rd operand can't be immediate operand. */
6592 gas_assert (operand_type_check (i.types[2], imm) == 0);
6593 }
6594
6595 return 1;
6596 }
6597
6598 static int
6599 process_operands (void)
6600 {
6601 /* Default segment register this instruction will use for memory
6602 accesses. 0 means unknown. This is only for optimizing out
6603 unnecessary segment overrides. */
6604 const seg_entry *default_seg = 0;
6605
6606 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
6607 {
6608 unsigned int dupl = i.operands;
6609 unsigned int dest = dupl - 1;
6610 unsigned int j;
6611
6612 /* The destination must be an xmm register. */
6613 gas_assert (i.reg_operands
6614 && MAX_OPERANDS > dupl
6615 && operand_type_equal (&i.types[dest], &regxmm));
6616
6617 if (i.tm.operand_types[0].bitfield.acc
6618 && i.tm.operand_types[0].bitfield.xmmword)
6619 {
6620 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
6621 {
6622 /* Keep xmm0 for instructions with VEX prefix and 3
6623 sources. */
6624 i.tm.operand_types[0].bitfield.acc = 0;
6625 i.tm.operand_types[0].bitfield.regsimd = 1;
6626 goto duplicate;
6627 }
6628 else
6629 {
6630 /* We remove the first xmm0 and keep the number of
6631 operands unchanged, which in fact duplicates the
6632 destination. */
6633 for (j = 1; j < i.operands; j++)
6634 {
6635 i.op[j - 1] = i.op[j];
6636 i.types[j - 1] = i.types[j];
6637 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
6638 }
6639 }
6640 }
6641 else if (i.tm.opcode_modifier.implicit1stxmm0)
6642 {
6643 gas_assert ((MAX_OPERANDS - 1) > dupl
6644 && (i.tm.opcode_modifier.vexsources
6645 == VEX3SOURCES));
6646
6647 /* Add the implicit xmm0 for instructions with VEX prefix
6648 and 3 sources. */
6649 for (j = i.operands; j > 0; j--)
6650 {
6651 i.op[j] = i.op[j - 1];
6652 i.types[j] = i.types[j - 1];
6653 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
6654 }
6655 i.op[0].regs
6656 = (const reg_entry *) hash_find (reg_hash, "xmm0");
6657 i.types[0] = regxmm;
6658 i.tm.operand_types[0] = regxmm;
6659
6660 i.operands += 2;
6661 i.reg_operands += 2;
6662 i.tm.operands += 2;
6663
6664 dupl++;
6665 dest++;
6666 i.op[dupl] = i.op[dest];
6667 i.types[dupl] = i.types[dest];
6668 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6669 }
6670 else
6671 {
6672 duplicate:
6673 i.operands++;
6674 i.reg_operands++;
6675 i.tm.operands++;
6676
6677 i.op[dupl] = i.op[dest];
6678 i.types[dupl] = i.types[dest];
6679 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
6680 }
6681
6682 if (i.tm.opcode_modifier.immext)
6683 process_immext ();
6684 }
6685 else if (i.tm.operand_types[0].bitfield.acc
6686 && i.tm.operand_types[0].bitfield.xmmword)
6687 {
6688 unsigned int j;
6689
6690 for (j = 1; j < i.operands; j++)
6691 {
6692 i.op[j - 1] = i.op[j];
6693 i.types[j - 1] = i.types[j];
6694
6695 /* We need to adjust fields in i.tm since they are used by
6696 build_modrm_byte. */
6697 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
6698 }
6699
6700 i.operands--;
6701 i.reg_operands--;
6702 i.tm.operands--;
6703 }
6704 else if (i.tm.opcode_modifier.implicitquadgroup)
6705 {
6706 unsigned int regnum, first_reg_in_group, last_reg_in_group;
6707
6708 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
6709 gas_assert (i.operands >= 2 && i.types[1].bitfield.regsimd);
6710 regnum = register_number (i.op[1].regs);
6711 first_reg_in_group = regnum & ~3;
6712 last_reg_in_group = first_reg_in_group + 3;
6713 if (regnum != first_reg_in_group)
6714 as_warn (_("source register `%s%s' implicitly denotes"
6715 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
6716 register_prefix, i.op[1].regs->reg_name,
6717 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
6718 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
6719 i.tm.name);
6720 }
6721 else if (i.tm.opcode_modifier.regkludge)
6722 {
6723 /* The imul $imm, %reg instruction is converted into
6724 imul $imm, %reg, %reg, and the clr %reg instruction
6725 is converted into xor %reg, %reg. */
6726
6727 unsigned int first_reg_op;
6728
6729 if (operand_type_check (i.types[0], reg))
6730 first_reg_op = 0;
6731 else
6732 first_reg_op = 1;
6733 /* Pretend we saw the extra register operand. */
6734 gas_assert (i.reg_operands == 1
6735 && i.op[first_reg_op + 1].regs == 0);
6736 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
6737 i.types[first_reg_op + 1] = i.types[first_reg_op];
6738 i.operands++;
6739 i.reg_operands++;
6740 }
6741
6742 if (i.tm.opcode_modifier.shortform)
6743 {
6744 if (i.types[0].bitfield.sreg2
6745 || i.types[0].bitfield.sreg3)
6746 {
6747 if (i.tm.base_opcode == POP_SEG_SHORT
6748 && i.op[0].regs->reg_num == 1)
6749 {
6750 as_bad (_("you can't `pop %scs'"), register_prefix);
6751 return 0;
6752 }
6753 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
6754 if ((i.op[0].regs->reg_flags & RegRex) != 0)
6755 i.rex |= REX_B;
6756 }
6757 else
6758 {
6759 /* The register or float register operand is in operand
6760 0 or 1. */
6761 unsigned int op;
6762
6763 if ((i.types[0].bitfield.reg && i.types[0].bitfield.tbyte)
6764 || operand_type_check (i.types[0], reg))
6765 op = 0;
6766 else
6767 op = 1;
6768 /* Register goes in low 3 bits of opcode. */
6769 i.tm.base_opcode |= i.op[op].regs->reg_num;
6770 if ((i.op[op].regs->reg_flags & RegRex) != 0)
6771 i.rex |= REX_B;
6772 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
6773 {
6774 /* Warn about some common errors, but press on regardless.
6775 The first case can be generated by gcc (<= 2.8.1). */
6776 if (i.operands == 2)
6777 {
6778 /* Reversed arguments on faddp, fsubp, etc. */
6779 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
6780 register_prefix, i.op[!intel_syntax].regs->reg_name,
6781 register_prefix, i.op[intel_syntax].regs->reg_name);
6782 }
6783 else
6784 {
6785 /* Extraneous `l' suffix on fp insn. */
6786 as_warn (_("translating to `%s %s%s'"), i.tm.name,
6787 register_prefix, i.op[0].regs->reg_name);
6788 }
6789 }
6790 }
6791 }
6792 else if (i.tm.opcode_modifier.modrm)
6793 {
6794 /* The opcode is completed (modulo i.tm.extension_opcode which
6795 must be put into the modrm byte). Now, we make the modrm and
6796 index base bytes based on all the info we've collected. */
6797
6798 default_seg = build_modrm_byte ();
6799 }
6800 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
6801 {
6802 default_seg = &ds;
6803 }
6804 else if (i.tm.opcode_modifier.isstring)
6805 {
6806 /* For the string instructions that allow a segment override
6807 on one of their operands, the default segment is ds. */
6808 default_seg = &ds;
6809 }
6810
6811 if (i.tm.base_opcode == 0x8d /* lea */
6812 && i.seg[0]
6813 && !quiet_warnings)
6814 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
6815
6816 /* If a segment was explicitly specified, and the specified segment
6817 is not the default, use an opcode prefix to select it. If we
6818 never figured out what the default segment is, then default_seg
6819 will be zero at this point, and the specified segment prefix will
6820 always be used. */
6821 if ((i.seg[0]) && (i.seg[0] != default_seg))
6822 {
6823 if (!add_prefix (i.seg[0]->seg_prefix))
6824 return 0;
6825 }
6826 return 1;
6827 }
6828
6829 static const seg_entry *
6830 build_modrm_byte (void)
6831 {
6832 const seg_entry *default_seg = 0;
6833 unsigned int source, dest;
6834 int vex_3_sources;
6835
6836 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
6837 if (vex_3_sources)
6838 {
6839 unsigned int nds, reg_slot;
6840 expressionS *exp;
6841
6842 dest = i.operands - 1;
6843 nds = dest - 1;
6844
6845 /* There are 2 kinds of instructions:
6846 1. 5 operands: 4 register operands or 3 register operands
6847 plus 1 memory operand plus one Vec_Imm4 operand, VexXDS, and
6848 VexW0 or VexW1. The destination must be either XMM, YMM or
6849 ZMM register.
6850 2. 4 operands: 4 register operands or 3 register operands
6851 plus 1 memory operand, with VexXDS. */
6852 gas_assert ((i.reg_operands == 4
6853 || (i.reg_operands == 3 && i.mem_operands == 1))
6854 && i.tm.opcode_modifier.vexvvvv == VEXXDS
6855 && i.tm.opcode_modifier.vexw
6856 && i.tm.operand_types[dest].bitfield.regsimd);
6857
6858 /* If VexW1 is set, the first non-immediate operand is the source and
6859 the second non-immediate one is encoded in the immediate operand. */
6860 if (i.tm.opcode_modifier.vexw == VEXW1)
6861 {
6862 source = i.imm_operands;
6863 reg_slot = i.imm_operands + 1;
6864 }
6865 else
6866 {
6867 source = i.imm_operands + 1;
6868 reg_slot = i.imm_operands;
6869 }
6870
6871 if (i.imm_operands == 0)
6872 {
6873 /* When there is no immediate operand, generate an 8bit
6874 immediate operand to encode the first operand. */
6875 exp = &im_expressions[i.imm_operands++];
6876 i.op[i.operands].imms = exp;
6877 i.types[i.operands] = imm8;
6878 i.operands++;
6879
6880 gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
6881 exp->X_op = O_constant;
6882 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
6883 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6884 }
6885 else
6886 {
6887 unsigned int imm_slot;
6888
6889 gas_assert (i.imm_operands == 1 && i.types[0].bitfield.vec_imm4);
6890
6891 if (i.tm.opcode_modifier.immext)
6892 {
6893 /* When ImmExt is set, the immediate byte is the last
6894 operand. */
6895 imm_slot = i.operands - 1;
6896 source--;
6897 reg_slot--;
6898 }
6899 else
6900 {
6901 imm_slot = 0;
6902
6903 /* Turn on Imm8 so that output_imm will generate it. */
6904 i.types[imm_slot].bitfield.imm8 = 1;
6905 }
6906
6907 gas_assert (i.tm.operand_types[reg_slot].bitfield.regsimd);
6908 i.op[imm_slot].imms->X_add_number
6909 |= register_number (i.op[reg_slot].regs) << 4;
6910 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6911 }
6912
6913 gas_assert (i.tm.operand_types[nds].bitfield.regsimd);
6914 i.vex.register_specifier = i.op[nds].regs;
6915 }
6916 else
6917 source = dest = 0;
6918
6919 /* i.reg_operands MUST be the number of real register operands;
6920 implicit registers do not count. If there are 3 register
6921 operands, it must be a instruction with VexNDS. For a
6922 instruction with VexNDD, the destination register is encoded
6923 in VEX prefix. If there are 4 register operands, it must be
6924 a instruction with VEX prefix and 3 sources. */
6925 if (i.mem_operands == 0
6926 && ((i.reg_operands == 2
6927 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
6928 || (i.reg_operands == 3
6929 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
6930 || (i.reg_operands == 4 && vex_3_sources)))
6931 {
6932 switch (i.operands)
6933 {
6934 case 2:
6935 source = 0;
6936 break;
6937 case 3:
6938 /* When there are 3 operands, one of them may be immediate,
6939 which may be the first or the last operand. Otherwise,
6940 the first operand must be shift count register (cl) or it
6941 is an instruction with VexNDS. */
6942 gas_assert (i.imm_operands == 1
6943 || (i.imm_operands == 0
6944 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
6945 || i.types[0].bitfield.shiftcount)));
6946 if (operand_type_check (i.types[0], imm)
6947 || i.types[0].bitfield.shiftcount)
6948 source = 1;
6949 else
6950 source = 0;
6951 break;
6952 case 4:
6953 /* When there are 4 operands, the first two must be 8bit
6954 immediate operands. The source operand will be the 3rd
6955 one.
6956
6957 For instructions with VexNDS, if the first operand
6958 an imm8, the source operand is the 2nd one. If the last
6959 operand is imm8, the source operand is the first one. */
6960 gas_assert ((i.imm_operands == 2
6961 && i.types[0].bitfield.imm8
6962 && i.types[1].bitfield.imm8)
6963 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
6964 && i.imm_operands == 1
6965 && (i.types[0].bitfield.imm8
6966 || i.types[i.operands - 1].bitfield.imm8
6967 || i.rounding)));
6968 if (i.imm_operands == 2)
6969 source = 2;
6970 else
6971 {
6972 if (i.types[0].bitfield.imm8)
6973 source = 1;
6974 else
6975 source = 0;
6976 }
6977 break;
6978 case 5:
6979 if (is_evex_encoding (&i.tm))
6980 {
6981 /* For EVEX instructions, when there are 5 operands, the
6982 first one must be immediate operand. If the second one
6983 is immediate operand, the source operand is the 3th
6984 one. If the last one is immediate operand, the source
6985 operand is the 2nd one. */
6986 gas_assert (i.imm_operands == 2
6987 && i.tm.opcode_modifier.sae
6988 && operand_type_check (i.types[0], imm));
6989 if (operand_type_check (i.types[1], imm))
6990 source = 2;
6991 else if (operand_type_check (i.types[4], imm))
6992 source = 1;
6993 else
6994 abort ();
6995 }
6996 break;
6997 default:
6998 abort ();
6999 }
7000
7001 if (!vex_3_sources)
7002 {
7003 dest = source + 1;
7004
7005 /* RC/SAE operand could be between DEST and SRC. That happens
7006 when one operand is GPR and the other one is XMM/YMM/ZMM
7007 register. */
7008 if (i.rounding && i.rounding->operand == (int) dest)
7009 dest++;
7010
7011 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7012 {
7013 /* For instructions with VexNDS, the register-only source
7014 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7015 register. It is encoded in VEX prefix. We need to
7016 clear RegMem bit before calling operand_type_equal. */
7017
7018 i386_operand_type op;
7019 unsigned int vvvv;
7020
7021 /* Check register-only source operand when two source
7022 operands are swapped. */
7023 if (!i.tm.operand_types[source].bitfield.baseindex
7024 && i.tm.operand_types[dest].bitfield.baseindex)
7025 {
7026 vvvv = source;
7027 source = dest;
7028 }
7029 else
7030 vvvv = dest;
7031
7032 op = i.tm.operand_types[vvvv];
7033 op.bitfield.regmem = 0;
7034 if ((dest + 1) >= i.operands
7035 || ((!op.bitfield.reg
7036 || (!op.bitfield.dword && !op.bitfield.qword))
7037 && !op.bitfield.regsimd
7038 && !operand_type_equal (&op, &regmask)))
7039 abort ();
7040 i.vex.register_specifier = i.op[vvvv].regs;
7041 dest++;
7042 }
7043 }
7044
7045 i.rm.mode = 3;
7046 /* One of the register operands will be encoded in the i.tm.reg
7047 field, the other in the combined i.tm.mode and i.tm.regmem
7048 fields. If no form of this instruction supports a memory
7049 destination operand, then we assume the source operand may
7050 sometimes be a memory operand and so we need to store the
7051 destination in the i.rm.reg field. */
7052 if (!i.tm.operand_types[dest].bitfield.regmem
7053 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7054 {
7055 i.rm.reg = i.op[dest].regs->reg_num;
7056 i.rm.regmem = i.op[source].regs->reg_num;
7057 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7058 i.rex |= REX_R;
7059 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7060 i.vrex |= REX_R;
7061 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7062 i.rex |= REX_B;
7063 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7064 i.vrex |= REX_B;
7065 }
7066 else
7067 {
7068 i.rm.reg = i.op[source].regs->reg_num;
7069 i.rm.regmem = i.op[dest].regs->reg_num;
7070 if ((i.op[dest].regs->reg_flags & RegRex) != 0)
7071 i.rex |= REX_B;
7072 if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
7073 i.vrex |= REX_B;
7074 if ((i.op[source].regs->reg_flags & RegRex) != 0)
7075 i.rex |= REX_R;
7076 if ((i.op[source].regs->reg_flags & RegVRex) != 0)
7077 i.vrex |= REX_R;
7078 }
7079 if (flag_code != CODE_64BIT && (i.rex & REX_R))
7080 {
7081 if (!i.types[i.tm.operand_types[0].bitfield.regmem].bitfield.control)
7082 abort ();
7083 i.rex &= ~REX_R;
7084 add_prefix (LOCK_PREFIX_OPCODE);
7085 }
7086 }
7087 else
7088 { /* If it's not 2 reg operands... */
7089 unsigned int mem;
7090
7091 if (i.mem_operands)
7092 {
7093 unsigned int fake_zero_displacement = 0;
7094 unsigned int op;
7095
7096 for (op = 0; op < i.operands; op++)
7097 if (operand_type_check (i.types[op], anymem))
7098 break;
7099 gas_assert (op < i.operands);
7100
7101 if (i.tm.opcode_modifier.vecsib)
7102 {
7103 if (i.index_reg->reg_num == RegIZ)
7104 abort ();
7105
7106 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7107 if (!i.base_reg)
7108 {
7109 i.sib.base = NO_BASE_REGISTER;
7110 i.sib.scale = i.log2_scale_factor;
7111 i.types[op].bitfield.disp8 = 0;
7112 i.types[op].bitfield.disp16 = 0;
7113 i.types[op].bitfield.disp64 = 0;
7114 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7115 {
7116 /* Must be 32 bit */
7117 i.types[op].bitfield.disp32 = 1;
7118 i.types[op].bitfield.disp32s = 0;
7119 }
7120 else
7121 {
7122 i.types[op].bitfield.disp32 = 0;
7123 i.types[op].bitfield.disp32s = 1;
7124 }
7125 }
7126 i.sib.index = i.index_reg->reg_num;
7127 if ((i.index_reg->reg_flags & RegRex) != 0)
7128 i.rex |= REX_X;
7129 if ((i.index_reg->reg_flags & RegVRex) != 0)
7130 i.vrex |= REX_X;
7131 }
7132
7133 default_seg = &ds;
7134
7135 if (i.base_reg == 0)
7136 {
7137 i.rm.mode = 0;
7138 if (!i.disp_operands)
7139 fake_zero_displacement = 1;
7140 if (i.index_reg == 0)
7141 {
7142 i386_operand_type newdisp;
7143
7144 gas_assert (!i.tm.opcode_modifier.vecsib);
7145 /* Operand is just <disp> */
7146 if (flag_code == CODE_64BIT)
7147 {
7148 /* 64bit mode overwrites the 32bit absolute
7149 addressing by RIP relative addressing and
7150 absolute addressing is encoded by one of the
7151 redundant SIB forms. */
7152 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7153 i.sib.base = NO_BASE_REGISTER;
7154 i.sib.index = NO_INDEX_REGISTER;
7155 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
7156 }
7157 else if ((flag_code == CODE_16BIT)
7158 ^ (i.prefix[ADDR_PREFIX] != 0))
7159 {
7160 i.rm.regmem = NO_BASE_REGISTER_16;
7161 newdisp = disp16;
7162 }
7163 else
7164 {
7165 i.rm.regmem = NO_BASE_REGISTER;
7166 newdisp = disp32;
7167 }
7168 i.types[op] = operand_type_and_not (i.types[op], anydisp);
7169 i.types[op] = operand_type_or (i.types[op], newdisp);
7170 }
7171 else if (!i.tm.opcode_modifier.vecsib)
7172 {
7173 /* !i.base_reg && i.index_reg */
7174 if (i.index_reg->reg_num == RegIZ)
7175 i.sib.index = NO_INDEX_REGISTER;
7176 else
7177 i.sib.index = i.index_reg->reg_num;
7178 i.sib.base = NO_BASE_REGISTER;
7179 i.sib.scale = i.log2_scale_factor;
7180 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7181 i.types[op].bitfield.disp8 = 0;
7182 i.types[op].bitfield.disp16 = 0;
7183 i.types[op].bitfield.disp64 = 0;
7184 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
7185 {
7186 /* Must be 32 bit */
7187 i.types[op].bitfield.disp32 = 1;
7188 i.types[op].bitfield.disp32s = 0;
7189 }
7190 else
7191 {
7192 i.types[op].bitfield.disp32 = 0;
7193 i.types[op].bitfield.disp32s = 1;
7194 }
7195 if ((i.index_reg->reg_flags & RegRex) != 0)
7196 i.rex |= REX_X;
7197 }
7198 }
7199 /* RIP addressing for 64bit mode. */
7200 else if (i.base_reg->reg_num == RegIP)
7201 {
7202 gas_assert (!i.tm.opcode_modifier.vecsib);
7203 i.rm.regmem = NO_BASE_REGISTER;
7204 i.types[op].bitfield.disp8 = 0;
7205 i.types[op].bitfield.disp16 = 0;
7206 i.types[op].bitfield.disp32 = 0;
7207 i.types[op].bitfield.disp32s = 1;
7208 i.types[op].bitfield.disp64 = 0;
7209 i.flags[op] |= Operand_PCrel;
7210 if (! i.disp_operands)
7211 fake_zero_displacement = 1;
7212 }
7213 else if (i.base_reg->reg_type.bitfield.word)
7214 {
7215 gas_assert (!i.tm.opcode_modifier.vecsib);
7216 switch (i.base_reg->reg_num)
7217 {
7218 case 3: /* (%bx) */
7219 if (i.index_reg == 0)
7220 i.rm.regmem = 7;
7221 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
7222 i.rm.regmem = i.index_reg->reg_num - 6;
7223 break;
7224 case 5: /* (%bp) */
7225 default_seg = &ss;
7226 if (i.index_reg == 0)
7227 {
7228 i.rm.regmem = 6;
7229 if (operand_type_check (i.types[op], disp) == 0)
7230 {
7231 /* fake (%bp) into 0(%bp) */
7232 i.types[op].bitfield.disp8 = 1;
7233 fake_zero_displacement = 1;
7234 }
7235 }
7236 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
7237 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
7238 break;
7239 default: /* (%si) -> 4 or (%di) -> 5 */
7240 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
7241 }
7242 i.rm.mode = mode_from_disp_size (i.types[op]);
7243 }
7244 else /* i.base_reg and 32/64 bit mode */
7245 {
7246 if (flag_code == CODE_64BIT
7247 && operand_type_check (i.types[op], disp))
7248 {
7249 i.types[op].bitfield.disp16 = 0;
7250 i.types[op].bitfield.disp64 = 0;
7251 if (i.prefix[ADDR_PREFIX] == 0)
7252 {
7253 i.types[op].bitfield.disp32 = 0;
7254 i.types[op].bitfield.disp32s = 1;
7255 }
7256 else
7257 {
7258 i.types[op].bitfield.disp32 = 1;
7259 i.types[op].bitfield.disp32s = 0;
7260 }
7261 }
7262
7263 if (!i.tm.opcode_modifier.vecsib)
7264 i.rm.regmem = i.base_reg->reg_num;
7265 if ((i.base_reg->reg_flags & RegRex) != 0)
7266 i.rex |= REX_B;
7267 i.sib.base = i.base_reg->reg_num;
7268 /* x86-64 ignores REX prefix bit here to avoid decoder
7269 complications. */
7270 if (!(i.base_reg->reg_flags & RegRex)
7271 && (i.base_reg->reg_num == EBP_REG_NUM
7272 || i.base_reg->reg_num == ESP_REG_NUM))
7273 default_seg = &ss;
7274 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
7275 {
7276 fake_zero_displacement = 1;
7277 i.types[op].bitfield.disp8 = 1;
7278 }
7279 i.sib.scale = i.log2_scale_factor;
7280 if (i.index_reg == 0)
7281 {
7282 gas_assert (!i.tm.opcode_modifier.vecsib);
7283 /* <disp>(%esp) becomes two byte modrm with no index
7284 register. We've already stored the code for esp
7285 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
7286 Any base register besides %esp will not use the
7287 extra modrm byte. */
7288 i.sib.index = NO_INDEX_REGISTER;
7289 }
7290 else if (!i.tm.opcode_modifier.vecsib)
7291 {
7292 if (i.index_reg->reg_num == RegIZ)
7293 i.sib.index = NO_INDEX_REGISTER;
7294 else
7295 i.sib.index = i.index_reg->reg_num;
7296 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
7297 if ((i.index_reg->reg_flags & RegRex) != 0)
7298 i.rex |= REX_X;
7299 }
7300
7301 if (i.disp_operands
7302 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
7303 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
7304 i.rm.mode = 0;
7305 else
7306 {
7307 if (!fake_zero_displacement
7308 && !i.disp_operands
7309 && i.disp_encoding)
7310 {
7311 fake_zero_displacement = 1;
7312 if (i.disp_encoding == disp_encoding_8bit)
7313 i.types[op].bitfield.disp8 = 1;
7314 else
7315 i.types[op].bitfield.disp32 = 1;
7316 }
7317 i.rm.mode = mode_from_disp_size (i.types[op]);
7318 }
7319 }
7320
7321 if (fake_zero_displacement)
7322 {
7323 /* Fakes a zero displacement assuming that i.types[op]
7324 holds the correct displacement size. */
7325 expressionS *exp;
7326
7327 gas_assert (i.op[op].disps == 0);
7328 exp = &disp_expressions[i.disp_operands++];
7329 i.op[op].disps = exp;
7330 exp->X_op = O_constant;
7331 exp->X_add_number = 0;
7332 exp->X_add_symbol = (symbolS *) 0;
7333 exp->X_op_symbol = (symbolS *) 0;
7334 }
7335
7336 mem = op;
7337 }
7338 else
7339 mem = ~0;
7340
7341 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
7342 {
7343 if (operand_type_check (i.types[0], imm))
7344 i.vex.register_specifier = NULL;
7345 else
7346 {
7347 /* VEX.vvvv encodes one of the sources when the first
7348 operand is not an immediate. */
7349 if (i.tm.opcode_modifier.vexw == VEXW0)
7350 i.vex.register_specifier = i.op[0].regs;
7351 else
7352 i.vex.register_specifier = i.op[1].regs;
7353 }
7354
7355 /* Destination is a XMM register encoded in the ModRM.reg
7356 and VEX.R bit. */
7357 i.rm.reg = i.op[2].regs->reg_num;
7358 if ((i.op[2].regs->reg_flags & RegRex) != 0)
7359 i.rex |= REX_R;
7360
7361 /* ModRM.rm and VEX.B encodes the other source. */
7362 if (!i.mem_operands)
7363 {
7364 i.rm.mode = 3;
7365
7366 if (i.tm.opcode_modifier.vexw == VEXW0)
7367 i.rm.regmem = i.op[1].regs->reg_num;
7368 else
7369 i.rm.regmem = i.op[0].regs->reg_num;
7370
7371 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7372 i.rex |= REX_B;
7373 }
7374 }
7375 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
7376 {
7377 i.vex.register_specifier = i.op[2].regs;
7378 if (!i.mem_operands)
7379 {
7380 i.rm.mode = 3;
7381 i.rm.regmem = i.op[1].regs->reg_num;
7382 if ((i.op[1].regs->reg_flags & RegRex) != 0)
7383 i.rex |= REX_B;
7384 }
7385 }
7386 /* Fill in i.rm.reg or i.rm.regmem field with register operand
7387 (if any) based on i.tm.extension_opcode. Again, we must be
7388 careful to make sure that segment/control/debug/test/MMX
7389 registers are coded into the i.rm.reg field. */
7390 else if (i.reg_operands)
7391 {
7392 unsigned int op;
7393 unsigned int vex_reg = ~0;
7394
7395 for (op = 0; op < i.operands; op++)
7396 if (i.types[op].bitfield.reg
7397 || i.types[op].bitfield.regmmx
7398 || i.types[op].bitfield.regsimd
7399 || i.types[op].bitfield.regbnd
7400 || i.types[op].bitfield.regmask
7401 || i.types[op].bitfield.sreg2
7402 || i.types[op].bitfield.sreg3
7403 || i.types[op].bitfield.control
7404 || i.types[op].bitfield.debug
7405 || i.types[op].bitfield.test)
7406 break;
7407
7408 if (vex_3_sources)
7409 op = dest;
7410 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7411 {
7412 /* For instructions with VexNDS, the register-only
7413 source operand is encoded in VEX prefix. */
7414 gas_assert (mem != (unsigned int) ~0);
7415
7416 if (op > mem)
7417 {
7418 vex_reg = op++;
7419 gas_assert (op < i.operands);
7420 }
7421 else
7422 {
7423 /* Check register-only source operand when two source
7424 operands are swapped. */
7425 if (!i.tm.operand_types[op].bitfield.baseindex
7426 && i.tm.operand_types[op + 1].bitfield.baseindex)
7427 {
7428 vex_reg = op;
7429 op += 2;
7430 gas_assert (mem == (vex_reg + 1)
7431 && op < i.operands);
7432 }
7433 else
7434 {
7435 vex_reg = op + 1;
7436 gas_assert (vex_reg < i.operands);
7437 }
7438 }
7439 }
7440 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
7441 {
7442 /* For instructions with VexNDD, the register destination
7443 is encoded in VEX prefix. */
7444 if (i.mem_operands == 0)
7445 {
7446 /* There is no memory operand. */
7447 gas_assert ((op + 2) == i.operands);
7448 vex_reg = op + 1;
7449 }
7450 else
7451 {
7452 /* There are only 2 non-immediate operands. */
7453 gas_assert (op < i.imm_operands + 2
7454 && i.operands == i.imm_operands + 2);
7455 vex_reg = i.imm_operands + 1;
7456 }
7457 }
7458 else
7459 gas_assert (op < i.operands);
7460
7461 if (vex_reg != (unsigned int) ~0)
7462 {
7463 i386_operand_type *type = &i.tm.operand_types[vex_reg];
7464
7465 if ((!type->bitfield.reg
7466 || (!type->bitfield.dword && !type->bitfield.qword))
7467 && !type->bitfield.regsimd
7468 && !operand_type_equal (type, &regmask))
7469 abort ();
7470
7471 i.vex.register_specifier = i.op[vex_reg].regs;
7472 }
7473
7474 /* Don't set OP operand twice. */
7475 if (vex_reg != op)
7476 {
7477 /* If there is an extension opcode to put here, the
7478 register number must be put into the regmem field. */
7479 if (i.tm.extension_opcode != None)
7480 {
7481 i.rm.regmem = i.op[op].regs->reg_num;
7482 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7483 i.rex |= REX_B;
7484 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7485 i.vrex |= REX_B;
7486 }
7487 else
7488 {
7489 i.rm.reg = i.op[op].regs->reg_num;
7490 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7491 i.rex |= REX_R;
7492 if ((i.op[op].regs->reg_flags & RegVRex) != 0)
7493 i.vrex |= REX_R;
7494 }
7495 }
7496
7497 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
7498 must set it to 3 to indicate this is a register operand
7499 in the regmem field. */
7500 if (!i.mem_operands)
7501 i.rm.mode = 3;
7502 }
7503
7504 /* Fill in i.rm.reg field with extension opcode (if any). */
7505 if (i.tm.extension_opcode != None)
7506 i.rm.reg = i.tm.extension_opcode;
7507 }
7508 return default_seg;
7509 }
7510
7511 static void
7512 output_branch (void)
7513 {
7514 char *p;
7515 int size;
7516 int code16;
7517 int prefix;
7518 relax_substateT subtype;
7519 symbolS *sym;
7520 offsetT off;
7521
7522 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
7523 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
7524
7525 prefix = 0;
7526 if (i.prefix[DATA_PREFIX] != 0)
7527 {
7528 prefix = 1;
7529 i.prefixes -= 1;
7530 code16 ^= CODE16;
7531 }
7532 /* Pentium4 branch hints. */
7533 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7534 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7535 {
7536 prefix++;
7537 i.prefixes--;
7538 }
7539 if (i.prefix[REX_PREFIX] != 0)
7540 {
7541 prefix++;
7542 i.prefixes--;
7543 }
7544
7545 /* BND prefixed jump. */
7546 if (i.prefix[BND_PREFIX] != 0)
7547 {
7548 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7549 i.prefixes -= 1;
7550 }
7551
7552 if (i.prefixes != 0 && !intel_syntax)
7553 as_warn (_("skipping prefixes on this instruction"));
7554
7555 /* It's always a symbol; End frag & setup for relax.
7556 Make sure there is enough room in this frag for the largest
7557 instruction we may generate in md_convert_frag. This is 2
7558 bytes for the opcode and room for the prefix and largest
7559 displacement. */
7560 frag_grow (prefix + 2 + 4);
7561 /* Prefix and 1 opcode byte go in fr_fix. */
7562 p = frag_more (prefix + 1);
7563 if (i.prefix[DATA_PREFIX] != 0)
7564 *p++ = DATA_PREFIX_OPCODE;
7565 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
7566 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
7567 *p++ = i.prefix[SEG_PREFIX];
7568 if (i.prefix[REX_PREFIX] != 0)
7569 *p++ = i.prefix[REX_PREFIX];
7570 *p = i.tm.base_opcode;
7571
7572 if ((unsigned char) *p == JUMP_PC_RELATIVE)
7573 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
7574 else if (cpu_arch_flags.bitfield.cpui386)
7575 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
7576 else
7577 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
7578 subtype |= code16;
7579
7580 sym = i.op[0].disps->X_add_symbol;
7581 off = i.op[0].disps->X_add_number;
7582
7583 if (i.op[0].disps->X_op != O_constant
7584 && i.op[0].disps->X_op != O_symbol)
7585 {
7586 /* Handle complex expressions. */
7587 sym = make_expr_symbol (i.op[0].disps);
7588 off = 0;
7589 }
7590
7591 /* 1 possible extra opcode + 4 byte displacement go in var part.
7592 Pass reloc in fr_var. */
7593 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
7594 }
7595
7596 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7597 /* Return TRUE iff PLT32 relocation should be used for branching to
7598 symbol S. */
7599
7600 static bfd_boolean
7601 need_plt32_p (symbolS *s)
7602 {
7603 /* PLT32 relocation is ELF only. */
7604 if (!IS_ELF)
7605 return FALSE;
7606
7607 /* Since there is no need to prepare for PLT branch on x86-64, we
7608 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
7609 be used as a marker for 32-bit PC-relative branches. */
7610 if (!object_64bit)
7611 return FALSE;
7612
7613 /* Weak or undefined symbol need PLT32 relocation. */
7614 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
7615 return TRUE;
7616
7617 /* Non-global symbol doesn't need PLT32 relocation. */
7618 if (! S_IS_EXTERNAL (s))
7619 return FALSE;
7620
7621 /* Other global symbols need PLT32 relocation. NB: Symbol with
7622 non-default visibilities are treated as normal global symbol
7623 so that PLT32 relocation can be used as a marker for 32-bit
7624 PC-relative branches. It is useful for linker relaxation. */
7625 return TRUE;
7626 }
7627 #endif
7628
7629 static void
7630 output_jump (void)
7631 {
7632 char *p;
7633 int size;
7634 fixS *fixP;
7635 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
7636
7637 if (i.tm.opcode_modifier.jumpbyte)
7638 {
7639 /* This is a loop or jecxz type instruction. */
7640 size = 1;
7641 if (i.prefix[ADDR_PREFIX] != 0)
7642 {
7643 FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
7644 i.prefixes -= 1;
7645 }
7646 /* Pentium4 branch hints. */
7647 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
7648 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
7649 {
7650 FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
7651 i.prefixes--;
7652 }
7653 }
7654 else
7655 {
7656 int code16;
7657
7658 code16 = 0;
7659 if (flag_code == CODE_16BIT)
7660 code16 = CODE16;
7661
7662 if (i.prefix[DATA_PREFIX] != 0)
7663 {
7664 FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
7665 i.prefixes -= 1;
7666 code16 ^= CODE16;
7667 }
7668
7669 size = 4;
7670 if (code16)
7671 size = 2;
7672 }
7673
7674 if (i.prefix[REX_PREFIX] != 0)
7675 {
7676 FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
7677 i.prefixes -= 1;
7678 }
7679
7680 /* BND prefixed jump. */
7681 if (i.prefix[BND_PREFIX] != 0)
7682 {
7683 FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
7684 i.prefixes -= 1;
7685 }
7686
7687 if (i.prefixes != 0 && !intel_syntax)
7688 as_warn (_("skipping prefixes on this instruction"));
7689
7690 p = frag_more (i.tm.opcode_length + size);
7691 switch (i.tm.opcode_length)
7692 {
7693 case 2:
7694 *p++ = i.tm.base_opcode >> 8;
7695 /* Fall through. */
7696 case 1:
7697 *p++ = i.tm.base_opcode;
7698 break;
7699 default:
7700 abort ();
7701 }
7702
7703 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7704 if (size == 4
7705 && jump_reloc == NO_RELOC
7706 && need_plt32_p (i.op[0].disps->X_add_symbol))
7707 jump_reloc = BFD_RELOC_X86_64_PLT32;
7708 #endif
7709
7710 jump_reloc = reloc (size, 1, 1, jump_reloc);
7711
7712 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7713 i.op[0].disps, 1, jump_reloc);
7714
7715 /* All jumps handled here are signed, but don't use a signed limit
7716 check for 32 and 16 bit jumps as we want to allow wrap around at
7717 4G and 64k respectively. */
7718 if (size == 1)
7719 fixP->fx_signed = 1;
7720 }
7721
7722 static void
7723 output_interseg_jump (void)
7724 {
7725 char *p;
7726 int size;
7727 int prefix;
7728 int code16;
7729
7730 code16 = 0;
7731 if (flag_code == CODE_16BIT)
7732 code16 = CODE16;
7733
7734 prefix = 0;
7735 if (i.prefix[DATA_PREFIX] != 0)
7736 {
7737 prefix = 1;
7738 i.prefixes -= 1;
7739 code16 ^= CODE16;
7740 }
7741 if (i.prefix[REX_PREFIX] != 0)
7742 {
7743 prefix++;
7744 i.prefixes -= 1;
7745 }
7746
7747 size = 4;
7748 if (code16)
7749 size = 2;
7750
7751 if (i.prefixes != 0 && !intel_syntax)
7752 as_warn (_("skipping prefixes on this instruction"));
7753
7754 /* 1 opcode; 2 segment; offset */
7755 p = frag_more (prefix + 1 + 2 + size);
7756
7757 if (i.prefix[DATA_PREFIX] != 0)
7758 *p++ = DATA_PREFIX_OPCODE;
7759
7760 if (i.prefix[REX_PREFIX] != 0)
7761 *p++ = i.prefix[REX_PREFIX];
7762
7763 *p++ = i.tm.base_opcode;
7764 if (i.op[1].imms->X_op == O_constant)
7765 {
7766 offsetT n = i.op[1].imms->X_add_number;
7767
7768 if (size == 2
7769 && !fits_in_unsigned_word (n)
7770 && !fits_in_signed_word (n))
7771 {
7772 as_bad (_("16-bit jump out of range"));
7773 return;
7774 }
7775 md_number_to_chars (p, n, size);
7776 }
7777 else
7778 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7779 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
7780 if (i.op[0].imms->X_op != O_constant)
7781 as_bad (_("can't handle non absolute segment in `%s'"),
7782 i.tm.name);
7783 md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
7784 }
7785
7786 static void
7787 output_insn (void)
7788 {
7789 fragS *insn_start_frag;
7790 offsetT insn_start_off;
7791
7792 /* Tie dwarf2 debug info to the address at the start of the insn.
7793 We can't do this after the insn has been output as the current
7794 frag may have been closed off. eg. by frag_var. */
7795 dwarf2_emit_insn (0);
7796
7797 insn_start_frag = frag_now;
7798 insn_start_off = frag_now_fix ();
7799
7800 /* Output jumps. */
7801 if (i.tm.opcode_modifier.jump)
7802 output_branch ();
7803 else if (i.tm.opcode_modifier.jumpbyte
7804 || i.tm.opcode_modifier.jumpdword)
7805 output_jump ();
7806 else if (i.tm.opcode_modifier.jumpintersegment)
7807 output_interseg_jump ();
7808 else
7809 {
7810 /* Output normal instructions here. */
7811 char *p;
7812 unsigned char *q;
7813 unsigned int j;
7814 unsigned int prefix;
7815
7816 if (avoid_fence
7817 && i.tm.base_opcode == 0xfae
7818 && i.operands == 1
7819 && i.imm_operands == 1
7820 && (i.op[0].imms->X_add_number == 0xe8
7821 || i.op[0].imms->X_add_number == 0xf0
7822 || i.op[0].imms->X_add_number == 0xf8))
7823 {
7824 /* Encode lfence, mfence, and sfence as
7825 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
7826 offsetT val = 0x240483f0ULL;
7827 p = frag_more (5);
7828 md_number_to_chars (p, val, 5);
7829 return;
7830 }
7831
7832 /* Some processors fail on LOCK prefix. This options makes
7833 assembler ignore LOCK prefix and serves as a workaround. */
7834 if (omit_lock_prefix)
7835 {
7836 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
7837 return;
7838 i.prefix[LOCK_PREFIX] = 0;
7839 }
7840
7841 /* Since the VEX/EVEX prefix contains the implicit prefix, we
7842 don't need the explicit prefix. */
7843 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
7844 {
7845 switch (i.tm.opcode_length)
7846 {
7847 case 3:
7848 if (i.tm.base_opcode & 0xff000000)
7849 {
7850 prefix = (i.tm.base_opcode >> 24) & 0xff;
7851 add_prefix (prefix);
7852 }
7853 break;
7854 case 2:
7855 if ((i.tm.base_opcode & 0xff0000) != 0)
7856 {
7857 prefix = (i.tm.base_opcode >> 16) & 0xff;
7858 if (!i.tm.cpu_flags.bitfield.cpupadlock
7859 || prefix != REPE_PREFIX_OPCODE
7860 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
7861 add_prefix (prefix);
7862 }
7863 break;
7864 case 1:
7865 break;
7866 case 0:
7867 /* Check for pseudo prefixes. */
7868 as_bad_where (insn_start_frag->fr_file,
7869 insn_start_frag->fr_line,
7870 _("pseudo prefix without instruction"));
7871 return;
7872 default:
7873 abort ();
7874 }
7875
7876 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
7877 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
7878 R_X86_64_GOTTPOFF relocation so that linker can safely
7879 perform IE->LE optimization. */
7880 if (x86_elf_abi == X86_64_X32_ABI
7881 && i.operands == 2
7882 && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
7883 && i.prefix[REX_PREFIX] == 0)
7884 add_prefix (REX_OPCODE);
7885 #endif
7886
7887 /* The prefix bytes. */
7888 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
7889 if (*q)
7890 FRAG_APPEND_1_CHAR (*q);
7891 }
7892 else
7893 {
7894 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
7895 if (*q)
7896 switch (j)
7897 {
7898 case REX_PREFIX:
7899 /* REX byte is encoded in VEX prefix. */
7900 break;
7901 case SEG_PREFIX:
7902 case ADDR_PREFIX:
7903 FRAG_APPEND_1_CHAR (*q);
7904 break;
7905 default:
7906 /* There should be no other prefixes for instructions
7907 with VEX prefix. */
7908 abort ();
7909 }
7910
7911 /* For EVEX instructions i.vrex should become 0 after
7912 build_evex_prefix. For VEX instructions upper 16 registers
7913 aren't available, so VREX should be 0. */
7914 if (i.vrex)
7915 abort ();
7916 /* Now the VEX prefix. */
7917 p = frag_more (i.vex.length);
7918 for (j = 0; j < i.vex.length; j++)
7919 p[j] = i.vex.bytes[j];
7920 }
7921
7922 /* Now the opcode; be careful about word order here! */
7923 if (i.tm.opcode_length == 1)
7924 {
7925 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
7926 }
7927 else
7928 {
7929 switch (i.tm.opcode_length)
7930 {
7931 case 4:
7932 p = frag_more (4);
7933 *p++ = (i.tm.base_opcode >> 24) & 0xff;
7934 *p++ = (i.tm.base_opcode >> 16) & 0xff;
7935 break;
7936 case 3:
7937 p = frag_more (3);
7938 *p++ = (i.tm.base_opcode >> 16) & 0xff;
7939 break;
7940 case 2:
7941 p = frag_more (2);
7942 break;
7943 default:
7944 abort ();
7945 break;
7946 }
7947
7948 /* Put out high byte first: can't use md_number_to_chars! */
7949 *p++ = (i.tm.base_opcode >> 8) & 0xff;
7950 *p = i.tm.base_opcode & 0xff;
7951 }
7952
7953 /* Now the modrm byte and sib byte (if present). */
7954 if (i.tm.opcode_modifier.modrm)
7955 {
7956 FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
7957 | i.rm.reg << 3
7958 | i.rm.mode << 6));
7959 /* If i.rm.regmem == ESP (4)
7960 && i.rm.mode != (Register mode)
7961 && not 16 bit
7962 ==> need second modrm byte. */
7963 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
7964 && i.rm.mode != 3
7965 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
7966 FRAG_APPEND_1_CHAR ((i.sib.base << 0
7967 | i.sib.index << 3
7968 | i.sib.scale << 6));
7969 }
7970
7971 if (i.disp_operands)
7972 output_disp (insn_start_frag, insn_start_off);
7973
7974 if (i.imm_operands)
7975 output_imm (insn_start_frag, insn_start_off);
7976 }
7977
7978 #ifdef DEBUG386
7979 if (flag_debug)
7980 {
7981 pi ("" /*line*/, &i);
7982 }
7983 #endif /* DEBUG386 */
7984 }
7985
7986 /* Return the size of the displacement operand N. */
7987
7988 static int
7989 disp_size (unsigned int n)
7990 {
7991 int size = 4;
7992
7993 if (i.types[n].bitfield.disp64)
7994 size = 8;
7995 else if (i.types[n].bitfield.disp8)
7996 size = 1;
7997 else if (i.types[n].bitfield.disp16)
7998 size = 2;
7999 return size;
8000 }
8001
8002 /* Return the size of the immediate operand N. */
8003
8004 static int
8005 imm_size (unsigned int n)
8006 {
8007 int size = 4;
8008 if (i.types[n].bitfield.imm64)
8009 size = 8;
8010 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
8011 size = 1;
8012 else if (i.types[n].bitfield.imm16)
8013 size = 2;
8014 return size;
8015 }
8016
8017 static void
8018 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
8019 {
8020 char *p;
8021 unsigned int n;
8022
8023 for (n = 0; n < i.operands; n++)
8024 {
8025 if (operand_type_check (i.types[n], disp))
8026 {
8027 if (i.op[n].disps->X_op == O_constant)
8028 {
8029 int size = disp_size (n);
8030 offsetT val = i.op[n].disps->X_add_number;
8031
8032 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
8033 size);
8034 p = frag_more (size);
8035 md_number_to_chars (p, val, size);
8036 }
8037 else
8038 {
8039 enum bfd_reloc_code_real reloc_type;
8040 int size = disp_size (n);
8041 int sign = i.types[n].bitfield.disp32s;
8042 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
8043 fixS *fixP;
8044
8045 /* We can't have 8 bit displacement here. */
8046 gas_assert (!i.types[n].bitfield.disp8);
8047
8048 /* The PC relative address is computed relative
8049 to the instruction boundary, so in case immediate
8050 fields follows, we need to adjust the value. */
8051 if (pcrel && i.imm_operands)
8052 {
8053 unsigned int n1;
8054 int sz = 0;
8055
8056 for (n1 = 0; n1 < i.operands; n1++)
8057 if (operand_type_check (i.types[n1], imm))
8058 {
8059 /* Only one immediate is allowed for PC
8060 relative address. */
8061 gas_assert (sz == 0);
8062 sz = imm_size (n1);
8063 i.op[n].disps->X_add_number -= sz;
8064 }
8065 /* We should find the immediate. */
8066 gas_assert (sz != 0);
8067 }
8068
8069 p = frag_more (size);
8070 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
8071 if (GOT_symbol
8072 && GOT_symbol == i.op[n].disps->X_add_symbol
8073 && (((reloc_type == BFD_RELOC_32
8074 || reloc_type == BFD_RELOC_X86_64_32S
8075 || (reloc_type == BFD_RELOC_64
8076 && object_64bit))
8077 && (i.op[n].disps->X_op == O_symbol
8078 || (i.op[n].disps->X_op == O_add
8079 && ((symbol_get_value_expression
8080 (i.op[n].disps->X_op_symbol)->X_op)
8081 == O_subtract))))
8082 || reloc_type == BFD_RELOC_32_PCREL))
8083 {
8084 offsetT add;
8085
8086 if (insn_start_frag == frag_now)
8087 add = (p - frag_now->fr_literal) - insn_start_off;
8088 else
8089 {
8090 fragS *fr;
8091
8092 add = insn_start_frag->fr_fix - insn_start_off;
8093 for (fr = insn_start_frag->fr_next;
8094 fr && fr != frag_now; fr = fr->fr_next)
8095 add += fr->fr_fix;
8096 add += p - frag_now->fr_literal;
8097 }
8098
8099 if (!object_64bit)
8100 {
8101 reloc_type = BFD_RELOC_386_GOTPC;
8102 i.op[n].imms->X_add_number += add;
8103 }
8104 else if (reloc_type == BFD_RELOC_64)
8105 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8106 else
8107 /* Don't do the adjustment for x86-64, as there
8108 the pcrel addressing is relative to the _next_
8109 insn, and that is taken care of in other code. */
8110 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8111 }
8112 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
8113 size, i.op[n].disps, pcrel,
8114 reloc_type);
8115 /* Check for "call/jmp *mem", "mov mem, %reg",
8116 "test %reg, mem" and "binop mem, %reg" where binop
8117 is one of adc, add, and, cmp, or, sbb, sub, xor
8118 instructions. Always generate R_386_GOT32X for
8119 "sym*GOT" operand in 32-bit mode. */
8120 if ((generate_relax_relocations
8121 || (!object_64bit
8122 && i.rm.mode == 0
8123 && i.rm.regmem == 5))
8124 && (i.rm.mode == 2
8125 || (i.rm.mode == 0 && i.rm.regmem == 5))
8126 && ((i.operands == 1
8127 && i.tm.base_opcode == 0xff
8128 && (i.rm.reg == 2 || i.rm.reg == 4))
8129 || (i.operands == 2
8130 && (i.tm.base_opcode == 0x8b
8131 || i.tm.base_opcode == 0x85
8132 || (i.tm.base_opcode & 0xc7) == 0x03))))
8133 {
8134 if (object_64bit)
8135 {
8136 fixP->fx_tcbit = i.rex != 0;
8137 if (i.base_reg
8138 && (i.base_reg->reg_num == RegIP))
8139 fixP->fx_tcbit2 = 1;
8140 }
8141 else
8142 fixP->fx_tcbit2 = 1;
8143 }
8144 }
8145 }
8146 }
8147 }
8148
8149 static void
8150 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
8151 {
8152 char *p;
8153 unsigned int n;
8154
8155 for (n = 0; n < i.operands; n++)
8156 {
8157 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
8158 if (i.rounding && (int) n == i.rounding->operand)
8159 continue;
8160
8161 if (operand_type_check (i.types[n], imm))
8162 {
8163 if (i.op[n].imms->X_op == O_constant)
8164 {
8165 int size = imm_size (n);
8166 offsetT val;
8167
8168 val = offset_in_range (i.op[n].imms->X_add_number,
8169 size);
8170 p = frag_more (size);
8171 md_number_to_chars (p, val, size);
8172 }
8173 else
8174 {
8175 /* Not absolute_section.
8176 Need a 32-bit fixup (don't support 8bit
8177 non-absolute imms). Try to support other
8178 sizes ... */
8179 enum bfd_reloc_code_real reloc_type;
8180 int size = imm_size (n);
8181 int sign;
8182
8183 if (i.types[n].bitfield.imm32s
8184 && (i.suffix == QWORD_MNEM_SUFFIX
8185 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
8186 sign = 1;
8187 else
8188 sign = 0;
8189
8190 p = frag_more (size);
8191 reloc_type = reloc (size, 0, sign, i.reloc[n]);
8192
8193 /* This is tough to explain. We end up with this one if we
8194 * have operands that look like
8195 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
8196 * obtain the absolute address of the GOT, and it is strongly
8197 * preferable from a performance point of view to avoid using
8198 * a runtime relocation for this. The actual sequence of
8199 * instructions often look something like:
8200 *
8201 * call .L66
8202 * .L66:
8203 * popl %ebx
8204 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
8205 *
8206 * The call and pop essentially return the absolute address
8207 * of the label .L66 and store it in %ebx. The linker itself
8208 * will ultimately change the first operand of the addl so
8209 * that %ebx points to the GOT, but to keep things simple, the
8210 * .o file must have this operand set so that it generates not
8211 * the absolute address of .L66, but the absolute address of
8212 * itself. This allows the linker itself simply treat a GOTPC
8213 * relocation as asking for a pcrel offset to the GOT to be
8214 * added in, and the addend of the relocation is stored in the
8215 * operand field for the instruction itself.
8216 *
8217 * Our job here is to fix the operand so that it would add
8218 * the correct offset so that %ebx would point to itself. The
8219 * thing that is tricky is that .-.L66 will point to the
8220 * beginning of the instruction, so we need to further modify
8221 * the operand so that it will point to itself. There are
8222 * other cases where you have something like:
8223 *
8224 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
8225 *
8226 * and here no correction would be required. Internally in
8227 * the assembler we treat operands of this form as not being
8228 * pcrel since the '.' is explicitly mentioned, and I wonder
8229 * whether it would simplify matters to do it this way. Who
8230 * knows. In earlier versions of the PIC patches, the
8231 * pcrel_adjust field was used to store the correction, but
8232 * since the expression is not pcrel, I felt it would be
8233 * confusing to do it this way. */
8234
8235 if ((reloc_type == BFD_RELOC_32
8236 || reloc_type == BFD_RELOC_X86_64_32S
8237 || reloc_type == BFD_RELOC_64)
8238 && GOT_symbol
8239 && GOT_symbol == i.op[n].imms->X_add_symbol
8240 && (i.op[n].imms->X_op == O_symbol
8241 || (i.op[n].imms->X_op == O_add
8242 && ((symbol_get_value_expression
8243 (i.op[n].imms->X_op_symbol)->X_op)
8244 == O_subtract))))
8245 {
8246 offsetT add;
8247
8248 if (insn_start_frag == frag_now)
8249 add = (p - frag_now->fr_literal) - insn_start_off;
8250 else
8251 {
8252 fragS *fr;
8253
8254 add = insn_start_frag->fr_fix - insn_start_off;
8255 for (fr = insn_start_frag->fr_next;
8256 fr && fr != frag_now; fr = fr->fr_next)
8257 add += fr->fr_fix;
8258 add += p - frag_now->fr_literal;
8259 }
8260
8261 if (!object_64bit)
8262 reloc_type = BFD_RELOC_386_GOTPC;
8263 else if (size == 4)
8264 reloc_type = BFD_RELOC_X86_64_GOTPC32;
8265 else if (size == 8)
8266 reloc_type = BFD_RELOC_X86_64_GOTPC64;
8267 i.op[n].imms->X_add_number += add;
8268 }
8269 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8270 i.op[n].imms, 0, reloc_type);
8271 }
8272 }
8273 }
8274 }
8275 \f
8276 /* x86_cons_fix_new is called via the expression parsing code when a
8277 reloc is needed. We use this hook to get the correct .got reloc. */
8278 static int cons_sign = -1;
8279
8280 void
8281 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
8282 expressionS *exp, bfd_reloc_code_real_type r)
8283 {
8284 r = reloc (len, 0, cons_sign, r);
8285
8286 #ifdef TE_PE
8287 if (exp->X_op == O_secrel)
8288 {
8289 exp->X_op = O_symbol;
8290 r = BFD_RELOC_32_SECREL;
8291 }
8292 #endif
8293
8294 fix_new_exp (frag, off, len, exp, 0, r);
8295 }
8296
8297 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
8298 purpose of the `.dc.a' internal pseudo-op. */
8299
8300 int
8301 x86_address_bytes (void)
8302 {
8303 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
8304 return 4;
8305 return stdoutput->arch_info->bits_per_address / 8;
8306 }
8307
8308 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
8309 || defined (LEX_AT)
8310 # define lex_got(reloc, adjust, types) NULL
8311 #else
8312 /* Parse operands of the form
8313 <symbol>@GOTOFF+<nnn>
8314 and similar .plt or .got references.
8315
8316 If we find one, set up the correct relocation in RELOC and copy the
8317 input string, minus the `@GOTOFF' into a malloc'd buffer for
8318 parsing by the calling routine. Return this buffer, and if ADJUST
8319 is non-null set it to the length of the string we removed from the
8320 input line. Otherwise return NULL. */
8321 static char *
8322 lex_got (enum bfd_reloc_code_real *rel,
8323 int *adjust,
8324 i386_operand_type *types)
8325 {
8326 /* Some of the relocations depend on the size of what field is to
8327 be relocated. But in our callers i386_immediate and i386_displacement
8328 we don't yet know the operand size (this will be set by insn
8329 matching). Hence we record the word32 relocation here,
8330 and adjust the reloc according to the real size in reloc(). */
8331 static const struct {
8332 const char *str;
8333 int len;
8334 const enum bfd_reloc_code_real rel[2];
8335 const i386_operand_type types64;
8336 } gotrel[] = {
8337 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8338 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
8339 BFD_RELOC_SIZE32 },
8340 OPERAND_TYPE_IMM32_64 },
8341 #endif
8342 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
8343 BFD_RELOC_X86_64_PLTOFF64 },
8344 OPERAND_TYPE_IMM64 },
8345 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
8346 BFD_RELOC_X86_64_PLT32 },
8347 OPERAND_TYPE_IMM32_32S_DISP32 },
8348 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
8349 BFD_RELOC_X86_64_GOTPLT64 },
8350 OPERAND_TYPE_IMM64_DISP64 },
8351 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
8352 BFD_RELOC_X86_64_GOTOFF64 },
8353 OPERAND_TYPE_IMM64_DISP64 },
8354 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
8355 BFD_RELOC_X86_64_GOTPCREL },
8356 OPERAND_TYPE_IMM32_32S_DISP32 },
8357 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
8358 BFD_RELOC_X86_64_TLSGD },
8359 OPERAND_TYPE_IMM32_32S_DISP32 },
8360 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
8361 _dummy_first_bfd_reloc_code_real },
8362 OPERAND_TYPE_NONE },
8363 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
8364 BFD_RELOC_X86_64_TLSLD },
8365 OPERAND_TYPE_IMM32_32S_DISP32 },
8366 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
8367 BFD_RELOC_X86_64_GOTTPOFF },
8368 OPERAND_TYPE_IMM32_32S_DISP32 },
8369 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
8370 BFD_RELOC_X86_64_TPOFF32 },
8371 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8372 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
8373 _dummy_first_bfd_reloc_code_real },
8374 OPERAND_TYPE_NONE },
8375 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
8376 BFD_RELOC_X86_64_DTPOFF32 },
8377 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8378 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
8379 _dummy_first_bfd_reloc_code_real },
8380 OPERAND_TYPE_NONE },
8381 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
8382 _dummy_first_bfd_reloc_code_real },
8383 OPERAND_TYPE_NONE },
8384 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
8385 BFD_RELOC_X86_64_GOT32 },
8386 OPERAND_TYPE_IMM32_32S_64_DISP32 },
8387 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
8388 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
8389 OPERAND_TYPE_IMM32_32S_DISP32 },
8390 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
8391 BFD_RELOC_X86_64_TLSDESC_CALL },
8392 OPERAND_TYPE_IMM32_32S_DISP32 },
8393 };
8394 char *cp;
8395 unsigned int j;
8396
8397 #if defined (OBJ_MAYBE_ELF)
8398 if (!IS_ELF)
8399 return NULL;
8400 #endif
8401
8402 for (cp = input_line_pointer; *cp != '@'; cp++)
8403 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
8404 return NULL;
8405
8406 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
8407 {
8408 int len = gotrel[j].len;
8409 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
8410 {
8411 if (gotrel[j].rel[object_64bit] != 0)
8412 {
8413 int first, second;
8414 char *tmpbuf, *past_reloc;
8415
8416 *rel = gotrel[j].rel[object_64bit];
8417
8418 if (types)
8419 {
8420 if (flag_code != CODE_64BIT)
8421 {
8422 types->bitfield.imm32 = 1;
8423 types->bitfield.disp32 = 1;
8424 }
8425 else
8426 *types = gotrel[j].types64;
8427 }
8428
8429 if (j != 0 && GOT_symbol == NULL)
8430 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
8431
8432 /* The length of the first part of our input line. */
8433 first = cp - input_line_pointer;
8434
8435 /* The second part goes from after the reloc token until
8436 (and including) an end_of_line char or comma. */
8437 past_reloc = cp + 1 + len;
8438 cp = past_reloc;
8439 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
8440 ++cp;
8441 second = cp + 1 - past_reloc;
8442
8443 /* Allocate and copy string. The trailing NUL shouldn't
8444 be necessary, but be safe. */
8445 tmpbuf = XNEWVEC (char, first + second + 2);
8446 memcpy (tmpbuf, input_line_pointer, first);
8447 if (second != 0 && *past_reloc != ' ')
8448 /* Replace the relocation token with ' ', so that
8449 errors like foo@GOTOFF1 will be detected. */
8450 tmpbuf[first++] = ' ';
8451 else
8452 /* Increment length by 1 if the relocation token is
8453 removed. */
8454 len++;
8455 if (adjust)
8456 *adjust = len;
8457 memcpy (tmpbuf + first, past_reloc, second);
8458 tmpbuf[first + second] = '\0';
8459 return tmpbuf;
8460 }
8461
8462 as_bad (_("@%s reloc is not supported with %d-bit output format"),
8463 gotrel[j].str, 1 << (5 + object_64bit));
8464 return NULL;
8465 }
8466 }
8467
8468 /* Might be a symbol version string. Don't as_bad here. */
8469 return NULL;
8470 }
8471 #endif
8472
8473 #ifdef TE_PE
8474 #ifdef lex_got
8475 #undef lex_got
8476 #endif
8477 /* Parse operands of the form
8478 <symbol>@SECREL32+<nnn>
8479
8480 If we find one, set up the correct relocation in RELOC and copy the
8481 input string, minus the `@SECREL32' into a malloc'd buffer for
8482 parsing by the calling routine. Return this buffer, and if ADJUST
8483 is non-null set it to the length of the string we removed from the
8484 input line. Otherwise return NULL.
8485
8486 This function is copied from the ELF version above adjusted for PE targets. */
8487
8488 static char *
8489 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
8490 int *adjust ATTRIBUTE_UNUSED,
8491 i386_operand_type *types)
8492 {
8493 static const struct
8494 {
8495 const char *str;
8496 int len;
8497 const enum bfd_reloc_code_real rel[2];
8498 const i386_operand_type types64;
8499 }
8500 gotrel[] =
8501 {
8502 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
8503 BFD_RELOC_32_SECREL },
8504 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
8505 };
8506
8507 char *cp;
8508 unsigned j;
8509
8510 for (cp = input_line_pointer; *cp != '@'; cp++)
8511 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
8512 return NULL;
8513
8514 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
8515 {
8516 int len = gotrel[j].len;
8517
8518 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
8519 {
8520 if (gotrel[j].rel[object_64bit] != 0)
8521 {
8522 int first, second;
8523 char *tmpbuf, *past_reloc;
8524
8525 *rel = gotrel[j].rel[object_64bit];
8526 if (adjust)
8527 *adjust = len;
8528
8529 if (types)
8530 {
8531 if (flag_code != CODE_64BIT)
8532 {
8533 types->bitfield.imm32 = 1;
8534 types->bitfield.disp32 = 1;
8535 }
8536 else
8537 *types = gotrel[j].types64;
8538 }
8539
8540 /* The length of the first part of our input line. */
8541 first = cp - input_line_pointer;
8542
8543 /* The second part goes from after the reloc token until
8544 (and including) an end_of_line char or comma. */
8545 past_reloc = cp + 1 + len;
8546 cp = past_reloc;
8547 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
8548 ++cp;
8549 second = cp + 1 - past_reloc;
8550
8551 /* Allocate and copy string. The trailing NUL shouldn't
8552 be necessary, but be safe. */
8553 tmpbuf = XNEWVEC (char, first + second + 2);
8554 memcpy (tmpbuf, input_line_pointer, first);
8555 if (second != 0 && *past_reloc != ' ')
8556 /* Replace the relocation token with ' ', so that
8557 errors like foo@SECLREL321 will be detected. */
8558 tmpbuf[first++] = ' ';
8559 memcpy (tmpbuf + first, past_reloc, second);
8560 tmpbuf[first + second] = '\0';
8561 return tmpbuf;
8562 }
8563
8564 as_bad (_("@%s reloc is not supported with %d-bit output format"),
8565 gotrel[j].str, 1 << (5 + object_64bit));
8566 return NULL;
8567 }
8568 }
8569
8570 /* Might be a symbol version string. Don't as_bad here. */
8571 return NULL;
8572 }
8573
8574 #endif /* TE_PE */
8575
8576 bfd_reloc_code_real_type
8577 x86_cons (expressionS *exp, int size)
8578 {
8579 bfd_reloc_code_real_type got_reloc = NO_RELOC;
8580
8581 intel_syntax = -intel_syntax;
8582
8583 exp->X_md = 0;
8584 if (size == 4 || (object_64bit && size == 8))
8585 {
8586 /* Handle @GOTOFF and the like in an expression. */
8587 char *save;
8588 char *gotfree_input_line;
8589 int adjust = 0;
8590
8591 save = input_line_pointer;
8592 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
8593 if (gotfree_input_line)
8594 input_line_pointer = gotfree_input_line;
8595
8596 expression (exp);
8597
8598 if (gotfree_input_line)
8599 {
8600 /* expression () has merrily parsed up to the end of line,
8601 or a comma - in the wrong buffer. Transfer how far
8602 input_line_pointer has moved to the right buffer. */
8603 input_line_pointer = (save
8604 + (input_line_pointer - gotfree_input_line)
8605 + adjust);
8606 free (gotfree_input_line);
8607 if (exp->X_op == O_constant
8608 || exp->X_op == O_absent
8609 || exp->X_op == O_illegal
8610 || exp->X_op == O_register
8611 || exp->X_op == O_big)
8612 {
8613 char c = *input_line_pointer;
8614 *input_line_pointer = 0;
8615 as_bad (_("missing or invalid expression `%s'"), save);
8616 *input_line_pointer = c;
8617 }
8618 }
8619 }
8620 else
8621 expression (exp);
8622
8623 intel_syntax = -intel_syntax;
8624
8625 if (intel_syntax)
8626 i386_intel_simplify (exp);
8627
8628 return got_reloc;
8629 }
8630
8631 static void
8632 signed_cons (int size)
8633 {
8634 if (flag_code == CODE_64BIT)
8635 cons_sign = 1;
8636 cons (size);
8637 cons_sign = -1;
8638 }
8639
8640 #ifdef TE_PE
8641 static void
8642 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
8643 {
8644 expressionS exp;
8645
8646 do
8647 {
8648 expression (&exp);
8649 if (exp.X_op == O_symbol)
8650 exp.X_op = O_secrel;
8651
8652 emit_expr (&exp, 4);
8653 }
8654 while (*input_line_pointer++ == ',');
8655
8656 input_line_pointer--;
8657 demand_empty_rest_of_line ();
8658 }
8659 #endif
8660
8661 /* Handle Vector operations. */
8662
8663 static char *
8664 check_VecOperations (char *op_string, char *op_end)
8665 {
8666 const reg_entry *mask;
8667 const char *saved;
8668 char *end_op;
8669
8670 while (*op_string
8671 && (op_end == NULL || op_string < op_end))
8672 {
8673 saved = op_string;
8674 if (*op_string == '{')
8675 {
8676 op_string++;
8677
8678 /* Check broadcasts. */
8679 if (strncmp (op_string, "1to", 3) == 0)
8680 {
8681 int bcst_type;
8682
8683 if (i.broadcast)
8684 goto duplicated_vec_op;
8685
8686 op_string += 3;
8687 if (*op_string == '8')
8688 bcst_type = 8;
8689 else if (*op_string == '4')
8690 bcst_type = 4;
8691 else if (*op_string == '2')
8692 bcst_type = 2;
8693 else if (*op_string == '1'
8694 && *(op_string+1) == '6')
8695 {
8696 bcst_type = 16;
8697 op_string++;
8698 }
8699 else
8700 {
8701 as_bad (_("Unsupported broadcast: `%s'"), saved);
8702 return NULL;
8703 }
8704 op_string++;
8705
8706 broadcast_op.type = bcst_type;
8707 broadcast_op.operand = this_operand;
8708 broadcast_op.bytes = 0;
8709 i.broadcast = &broadcast_op;
8710 }
8711 /* Check masking operation. */
8712 else if ((mask = parse_register (op_string, &end_op)) != NULL)
8713 {
8714 /* k0 can't be used for write mask. */
8715 if (!mask->reg_type.bitfield.regmask || mask->reg_num == 0)
8716 {
8717 as_bad (_("`%s%s' can't be used for write mask"),
8718 register_prefix, mask->reg_name);
8719 return NULL;
8720 }
8721
8722 if (!i.mask)
8723 {
8724 mask_op.mask = mask;
8725 mask_op.zeroing = 0;
8726 mask_op.operand = this_operand;
8727 i.mask = &mask_op;
8728 }
8729 else
8730 {
8731 if (i.mask->mask)
8732 goto duplicated_vec_op;
8733
8734 i.mask->mask = mask;
8735
8736 /* Only "{z}" is allowed here. No need to check
8737 zeroing mask explicitly. */
8738 if (i.mask->operand != this_operand)
8739 {
8740 as_bad (_("invalid write mask `%s'"), saved);
8741 return NULL;
8742 }
8743 }
8744
8745 op_string = end_op;
8746 }
8747 /* Check zeroing-flag for masking operation. */
8748 else if (*op_string == 'z')
8749 {
8750 if (!i.mask)
8751 {
8752 mask_op.mask = NULL;
8753 mask_op.zeroing = 1;
8754 mask_op.operand = this_operand;
8755 i.mask = &mask_op;
8756 }
8757 else
8758 {
8759 if (i.mask->zeroing)
8760 {
8761 duplicated_vec_op:
8762 as_bad (_("duplicated `%s'"), saved);
8763 return NULL;
8764 }
8765
8766 i.mask->zeroing = 1;
8767
8768 /* Only "{%k}" is allowed here. No need to check mask
8769 register explicitly. */
8770 if (i.mask->operand != this_operand)
8771 {
8772 as_bad (_("invalid zeroing-masking `%s'"),
8773 saved);
8774 return NULL;
8775 }
8776 }
8777
8778 op_string++;
8779 }
8780 else
8781 goto unknown_vec_op;
8782
8783 if (*op_string != '}')
8784 {
8785 as_bad (_("missing `}' in `%s'"), saved);
8786 return NULL;
8787 }
8788 op_string++;
8789
8790 /* Strip whitespace since the addition of pseudo prefixes
8791 changed how the scrubber treats '{'. */
8792 if (is_space_char (*op_string))
8793 ++op_string;
8794
8795 continue;
8796 }
8797 unknown_vec_op:
8798 /* We don't know this one. */
8799 as_bad (_("unknown vector operation: `%s'"), saved);
8800 return NULL;
8801 }
8802
8803 if (i.mask && i.mask->zeroing && !i.mask->mask)
8804 {
8805 as_bad (_("zeroing-masking only allowed with write mask"));
8806 return NULL;
8807 }
8808
8809 return op_string;
8810 }
8811
8812 static int
8813 i386_immediate (char *imm_start)
8814 {
8815 char *save_input_line_pointer;
8816 char *gotfree_input_line;
8817 segT exp_seg = 0;
8818 expressionS *exp;
8819 i386_operand_type types;
8820
8821 operand_type_set (&types, ~0);
8822
8823 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
8824 {
8825 as_bad (_("at most %d immediate operands are allowed"),
8826 MAX_IMMEDIATE_OPERANDS);
8827 return 0;
8828 }
8829
8830 exp = &im_expressions[i.imm_operands++];
8831 i.op[this_operand].imms = exp;
8832
8833 if (is_space_char (*imm_start))
8834 ++imm_start;
8835
8836 save_input_line_pointer = input_line_pointer;
8837 input_line_pointer = imm_start;
8838
8839 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
8840 if (gotfree_input_line)
8841 input_line_pointer = gotfree_input_line;
8842
8843 exp_seg = expression (exp);
8844
8845 SKIP_WHITESPACE ();
8846
8847 /* Handle vector operations. */
8848 if (*input_line_pointer == '{')
8849 {
8850 input_line_pointer = check_VecOperations (input_line_pointer,
8851 NULL);
8852 if (input_line_pointer == NULL)
8853 return 0;
8854 }
8855
8856 if (*input_line_pointer)
8857 as_bad (_("junk `%s' after expression"), input_line_pointer);
8858
8859 input_line_pointer = save_input_line_pointer;
8860 if (gotfree_input_line)
8861 {
8862 free (gotfree_input_line);
8863
8864 if (exp->X_op == O_constant || exp->X_op == O_register)
8865 exp->X_op = O_illegal;
8866 }
8867
8868 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
8869 }
8870
8871 static int
8872 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8873 i386_operand_type types, const char *imm_start)
8874 {
8875 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
8876 {
8877 if (imm_start)
8878 as_bad (_("missing or invalid immediate expression `%s'"),
8879 imm_start);
8880 return 0;
8881 }
8882 else if (exp->X_op == O_constant)
8883 {
8884 /* Size it properly later. */
8885 i.types[this_operand].bitfield.imm64 = 1;
8886 /* If not 64bit, sign extend val. */
8887 if (flag_code != CODE_64BIT
8888 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
8889 exp->X_add_number
8890 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
8891 }
8892 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
8893 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
8894 && exp_seg != absolute_section
8895 && exp_seg != text_section
8896 && exp_seg != data_section
8897 && exp_seg != bss_section
8898 && exp_seg != undefined_section
8899 && !bfd_is_com_section (exp_seg))
8900 {
8901 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
8902 return 0;
8903 }
8904 #endif
8905 else if (!intel_syntax && exp_seg == reg_section)
8906 {
8907 if (imm_start)
8908 as_bad (_("illegal immediate register operand %s"), imm_start);
8909 return 0;
8910 }
8911 else
8912 {
8913 /* This is an address. The size of the address will be
8914 determined later, depending on destination register,
8915 suffix, or the default for the section. */
8916 i.types[this_operand].bitfield.imm8 = 1;
8917 i.types[this_operand].bitfield.imm16 = 1;
8918 i.types[this_operand].bitfield.imm32 = 1;
8919 i.types[this_operand].bitfield.imm32s = 1;
8920 i.types[this_operand].bitfield.imm64 = 1;
8921 i.types[this_operand] = operand_type_and (i.types[this_operand],
8922 types);
8923 }
8924
8925 return 1;
8926 }
8927
8928 static char *
8929 i386_scale (char *scale)
8930 {
8931 offsetT val;
8932 char *save = input_line_pointer;
8933
8934 input_line_pointer = scale;
8935 val = get_absolute_expression ();
8936
8937 switch (val)
8938 {
8939 case 1:
8940 i.log2_scale_factor = 0;
8941 break;
8942 case 2:
8943 i.log2_scale_factor = 1;
8944 break;
8945 case 4:
8946 i.log2_scale_factor = 2;
8947 break;
8948 case 8:
8949 i.log2_scale_factor = 3;
8950 break;
8951 default:
8952 {
8953 char sep = *input_line_pointer;
8954
8955 *input_line_pointer = '\0';
8956 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
8957 scale);
8958 *input_line_pointer = sep;
8959 input_line_pointer = save;
8960 return NULL;
8961 }
8962 }
8963 if (i.log2_scale_factor != 0 && i.index_reg == 0)
8964 {
8965 as_warn (_("scale factor of %d without an index register"),
8966 1 << i.log2_scale_factor);
8967 i.log2_scale_factor = 0;
8968 }
8969 scale = input_line_pointer;
8970 input_line_pointer = save;
8971 return scale;
8972 }
8973
8974 static int
8975 i386_displacement (char *disp_start, char *disp_end)
8976 {
8977 expressionS *exp;
8978 segT exp_seg = 0;
8979 char *save_input_line_pointer;
8980 char *gotfree_input_line;
8981 int override;
8982 i386_operand_type bigdisp, types = anydisp;
8983 int ret;
8984
8985 if (i.disp_operands == MAX_MEMORY_OPERANDS)
8986 {
8987 as_bad (_("at most %d displacement operands are allowed"),
8988 MAX_MEMORY_OPERANDS);
8989 return 0;
8990 }
8991
8992 operand_type_set (&bigdisp, 0);
8993 if ((i.types[this_operand].bitfield.jumpabsolute)
8994 || (!current_templates->start->opcode_modifier.jump
8995 && !current_templates->start->opcode_modifier.jumpdword))
8996 {
8997 bigdisp.bitfield.disp32 = 1;
8998 override = (i.prefix[ADDR_PREFIX] != 0);
8999 if (flag_code == CODE_64BIT)
9000 {
9001 if (!override)
9002 {
9003 bigdisp.bitfield.disp32s = 1;
9004 bigdisp.bitfield.disp64 = 1;
9005 }
9006 }
9007 else if ((flag_code == CODE_16BIT) ^ override)
9008 {
9009 bigdisp.bitfield.disp32 = 0;
9010 bigdisp.bitfield.disp16 = 1;
9011 }
9012 }
9013 else
9014 {
9015 /* For PC-relative branches, the width of the displacement
9016 is dependent upon data size, not address size. */
9017 override = (i.prefix[DATA_PREFIX] != 0);
9018 if (flag_code == CODE_64BIT)
9019 {
9020 if (override || i.suffix == WORD_MNEM_SUFFIX)
9021 bigdisp.bitfield.disp16 = 1;
9022 else
9023 {
9024 bigdisp.bitfield.disp32 = 1;
9025 bigdisp.bitfield.disp32s = 1;
9026 }
9027 }
9028 else
9029 {
9030 if (!override)
9031 override = (i.suffix == (flag_code != CODE_16BIT
9032 ? WORD_MNEM_SUFFIX
9033 : LONG_MNEM_SUFFIX));
9034 bigdisp.bitfield.disp32 = 1;
9035 if ((flag_code == CODE_16BIT) ^ override)
9036 {
9037 bigdisp.bitfield.disp32 = 0;
9038 bigdisp.bitfield.disp16 = 1;
9039 }
9040 }
9041 }
9042 i.types[this_operand] = operand_type_or (i.types[this_operand],
9043 bigdisp);
9044
9045 exp = &disp_expressions[i.disp_operands];
9046 i.op[this_operand].disps = exp;
9047 i.disp_operands++;
9048 save_input_line_pointer = input_line_pointer;
9049 input_line_pointer = disp_start;
9050 END_STRING_AND_SAVE (disp_end);
9051
9052 #ifndef GCC_ASM_O_HACK
9053 #define GCC_ASM_O_HACK 0
9054 #endif
9055 #if GCC_ASM_O_HACK
9056 END_STRING_AND_SAVE (disp_end + 1);
9057 if (i.types[this_operand].bitfield.baseIndex
9058 && displacement_string_end[-1] == '+')
9059 {
9060 /* This hack is to avoid a warning when using the "o"
9061 constraint within gcc asm statements.
9062 For instance:
9063
9064 #define _set_tssldt_desc(n,addr,limit,type) \
9065 __asm__ __volatile__ ( \
9066 "movw %w2,%0\n\t" \
9067 "movw %w1,2+%0\n\t" \
9068 "rorl $16,%1\n\t" \
9069 "movb %b1,4+%0\n\t" \
9070 "movb %4,5+%0\n\t" \
9071 "movb $0,6+%0\n\t" \
9072 "movb %h1,7+%0\n\t" \
9073 "rorl $16,%1" \
9074 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
9075
9076 This works great except that the output assembler ends
9077 up looking a bit weird if it turns out that there is
9078 no offset. You end up producing code that looks like:
9079
9080 #APP
9081 movw $235,(%eax)
9082 movw %dx,2+(%eax)
9083 rorl $16,%edx
9084 movb %dl,4+(%eax)
9085 movb $137,5+(%eax)
9086 movb $0,6+(%eax)
9087 movb %dh,7+(%eax)
9088 rorl $16,%edx
9089 #NO_APP
9090
9091 So here we provide the missing zero. */
9092
9093 *displacement_string_end = '0';
9094 }
9095 #endif
9096 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
9097 if (gotfree_input_line)
9098 input_line_pointer = gotfree_input_line;
9099
9100 exp_seg = expression (exp);
9101
9102 SKIP_WHITESPACE ();
9103 if (*input_line_pointer)
9104 as_bad (_("junk `%s' after expression"), input_line_pointer);
9105 #if GCC_ASM_O_HACK
9106 RESTORE_END_STRING (disp_end + 1);
9107 #endif
9108 input_line_pointer = save_input_line_pointer;
9109 if (gotfree_input_line)
9110 {
9111 free (gotfree_input_line);
9112
9113 if (exp->X_op == O_constant || exp->X_op == O_register)
9114 exp->X_op = O_illegal;
9115 }
9116
9117 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
9118
9119 RESTORE_END_STRING (disp_end);
9120
9121 return ret;
9122 }
9123
9124 static int
9125 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
9126 i386_operand_type types, const char *disp_start)
9127 {
9128 i386_operand_type bigdisp;
9129 int ret = 1;
9130
9131 /* We do this to make sure that the section symbol is in
9132 the symbol table. We will ultimately change the relocation
9133 to be relative to the beginning of the section. */
9134 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
9135 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
9136 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9137 {
9138 if (exp->X_op != O_symbol)
9139 goto inv_disp;
9140
9141 if (S_IS_LOCAL (exp->X_add_symbol)
9142 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
9143 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
9144 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
9145 exp->X_op = O_subtract;
9146 exp->X_op_symbol = GOT_symbol;
9147 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
9148 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
9149 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
9150 i.reloc[this_operand] = BFD_RELOC_64;
9151 else
9152 i.reloc[this_operand] = BFD_RELOC_32;
9153 }
9154
9155 else if (exp->X_op == O_absent
9156 || exp->X_op == O_illegal
9157 || exp->X_op == O_big)
9158 {
9159 inv_disp:
9160 as_bad (_("missing or invalid displacement expression `%s'"),
9161 disp_start);
9162 ret = 0;
9163 }
9164
9165 else if (flag_code == CODE_64BIT
9166 && !i.prefix[ADDR_PREFIX]
9167 && exp->X_op == O_constant)
9168 {
9169 /* Since displacement is signed extended to 64bit, don't allow
9170 disp32 and turn off disp32s if they are out of range. */
9171 i.types[this_operand].bitfield.disp32 = 0;
9172 if (!fits_in_signed_long (exp->X_add_number))
9173 {
9174 i.types[this_operand].bitfield.disp32s = 0;
9175 if (i.types[this_operand].bitfield.baseindex)
9176 {
9177 as_bad (_("0x%lx out range of signed 32bit displacement"),
9178 (long) exp->X_add_number);
9179 ret = 0;
9180 }
9181 }
9182 }
9183
9184 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
9185 else if (exp->X_op != O_constant
9186 && OUTPUT_FLAVOR == bfd_target_aout_flavour
9187 && exp_seg != absolute_section
9188 && exp_seg != text_section
9189 && exp_seg != data_section
9190 && exp_seg != bss_section
9191 && exp_seg != undefined_section
9192 && !bfd_is_com_section (exp_seg))
9193 {
9194 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
9195 ret = 0;
9196 }
9197 #endif
9198
9199 /* Check if this is a displacement only operand. */
9200 bigdisp = i.types[this_operand];
9201 bigdisp.bitfield.disp8 = 0;
9202 bigdisp.bitfield.disp16 = 0;
9203 bigdisp.bitfield.disp32 = 0;
9204 bigdisp.bitfield.disp32s = 0;
9205 bigdisp.bitfield.disp64 = 0;
9206 if (operand_type_all_zero (&bigdisp))
9207 i.types[this_operand] = operand_type_and (i.types[this_operand],
9208 types);
9209
9210 return ret;
9211 }
9212
9213 /* Return the active addressing mode, taking address override and
9214 registers forming the address into consideration. Update the
9215 address override prefix if necessary. */
9216
9217 static enum flag_code
9218 i386_addressing_mode (void)
9219 {
9220 enum flag_code addr_mode;
9221
9222 if (i.prefix[ADDR_PREFIX])
9223 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
9224 else
9225 {
9226 addr_mode = flag_code;
9227
9228 #if INFER_ADDR_PREFIX
9229 if (i.mem_operands == 0)
9230 {
9231 /* Infer address prefix from the first memory operand. */
9232 const reg_entry *addr_reg = i.base_reg;
9233
9234 if (addr_reg == NULL)
9235 addr_reg = i.index_reg;
9236
9237 if (addr_reg)
9238 {
9239 if (addr_reg->reg_type.bitfield.dword)
9240 addr_mode = CODE_32BIT;
9241 else if (flag_code != CODE_64BIT
9242 && addr_reg->reg_type.bitfield.word)
9243 addr_mode = CODE_16BIT;
9244
9245 if (addr_mode != flag_code)
9246 {
9247 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
9248 i.prefixes += 1;
9249 /* Change the size of any displacement too. At most one
9250 of Disp16 or Disp32 is set.
9251 FIXME. There doesn't seem to be any real need for
9252 separate Disp16 and Disp32 flags. The same goes for
9253 Imm16 and Imm32. Removing them would probably clean
9254 up the code quite a lot. */
9255 if (flag_code != CODE_64BIT
9256 && (i.types[this_operand].bitfield.disp16
9257 || i.types[this_operand].bitfield.disp32))
9258 i.types[this_operand]
9259 = operand_type_xor (i.types[this_operand], disp16_32);
9260 }
9261 }
9262 }
9263 #endif
9264 }
9265
9266 return addr_mode;
9267 }
9268
9269 /* Make sure the memory operand we've been dealt is valid.
9270 Return 1 on success, 0 on a failure. */
9271
9272 static int
9273 i386_index_check (const char *operand_string)
9274 {
9275 const char *kind = "base/index";
9276 enum flag_code addr_mode = i386_addressing_mode ();
9277
9278 if (current_templates->start->opcode_modifier.isstring
9279 && !current_templates->start->opcode_modifier.immext
9280 && (current_templates->end[-1].opcode_modifier.isstring
9281 || i.mem_operands))
9282 {
9283 /* Memory operands of string insns are special in that they only allow
9284 a single register (rDI, rSI, or rBX) as their memory address. */
9285 const reg_entry *expected_reg;
9286 static const char *di_si[][2] =
9287 {
9288 { "esi", "edi" },
9289 { "si", "di" },
9290 { "rsi", "rdi" }
9291 };
9292 static const char *bx[] = { "ebx", "bx", "rbx" };
9293
9294 kind = "string address";
9295
9296 if (current_templates->start->opcode_modifier.repprefixok)
9297 {
9298 i386_operand_type type = current_templates->end[-1].operand_types[0];
9299
9300 if (!type.bitfield.baseindex
9301 || ((!i.mem_operands != !intel_syntax)
9302 && current_templates->end[-1].operand_types[1]
9303 .bitfield.baseindex))
9304 type = current_templates->end[-1].operand_types[1];
9305 expected_reg = hash_find (reg_hash,
9306 di_si[addr_mode][type.bitfield.esseg]);
9307
9308 }
9309 else
9310 expected_reg = hash_find (reg_hash, bx[addr_mode]);
9311
9312 if (i.base_reg != expected_reg
9313 || i.index_reg
9314 || operand_type_check (i.types[this_operand], disp))
9315 {
9316 /* The second memory operand must have the same size as
9317 the first one. */
9318 if (i.mem_operands
9319 && i.base_reg
9320 && !((addr_mode == CODE_64BIT
9321 && i.base_reg->reg_type.bitfield.qword)
9322 || (addr_mode == CODE_32BIT
9323 ? i.base_reg->reg_type.bitfield.dword
9324 : i.base_reg->reg_type.bitfield.word)))
9325 goto bad_address;
9326
9327 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
9328 operand_string,
9329 intel_syntax ? '[' : '(',
9330 register_prefix,
9331 expected_reg->reg_name,
9332 intel_syntax ? ']' : ')');
9333 return 1;
9334 }
9335 else
9336 return 1;
9337
9338 bad_address:
9339 as_bad (_("`%s' is not a valid %s expression"),
9340 operand_string, kind);
9341 return 0;
9342 }
9343 else
9344 {
9345 if (addr_mode != CODE_16BIT)
9346 {
9347 /* 32-bit/64-bit checks. */
9348 if ((i.base_reg
9349 && ((addr_mode == CODE_64BIT
9350 ? !i.base_reg->reg_type.bitfield.qword
9351 : !i.base_reg->reg_type.bitfield.dword)
9352 || (i.index_reg && i.base_reg->reg_num == RegIP)
9353 || i.base_reg->reg_num == RegIZ))
9354 || (i.index_reg
9355 && !i.index_reg->reg_type.bitfield.xmmword
9356 && !i.index_reg->reg_type.bitfield.ymmword
9357 && !i.index_reg->reg_type.bitfield.zmmword
9358 && ((addr_mode == CODE_64BIT
9359 ? !i.index_reg->reg_type.bitfield.qword
9360 : !i.index_reg->reg_type.bitfield.dword)
9361 || !i.index_reg->reg_type.bitfield.baseindex)))
9362 goto bad_address;
9363
9364 /* bndmk, bndldx, and bndstx have special restrictions. */
9365 if (current_templates->start->base_opcode == 0xf30f1b
9366 || (current_templates->start->base_opcode & ~1) == 0x0f1a)
9367 {
9368 /* They cannot use RIP-relative addressing. */
9369 if (i.base_reg && i.base_reg->reg_num == RegIP)
9370 {
9371 as_bad (_("`%s' cannot be used here"), operand_string);
9372 return 0;
9373 }
9374
9375 /* bndldx and bndstx ignore their scale factor. */
9376 if (current_templates->start->base_opcode != 0xf30f1b
9377 && i.log2_scale_factor)
9378 as_warn (_("register scaling is being ignored here"));
9379 }
9380 }
9381 else
9382 {
9383 /* 16-bit checks. */
9384 if ((i.base_reg
9385 && (!i.base_reg->reg_type.bitfield.word
9386 || !i.base_reg->reg_type.bitfield.baseindex))
9387 || (i.index_reg
9388 && (!i.index_reg->reg_type.bitfield.word
9389 || !i.index_reg->reg_type.bitfield.baseindex
9390 || !(i.base_reg
9391 && i.base_reg->reg_num < 6
9392 && i.index_reg->reg_num >= 6
9393 && i.log2_scale_factor == 0))))
9394 goto bad_address;
9395 }
9396 }
9397 return 1;
9398 }
9399
9400 /* Handle vector immediates. */
9401
9402 static int
9403 RC_SAE_immediate (const char *imm_start)
9404 {
9405 unsigned int match_found, j;
9406 const char *pstr = imm_start;
9407 expressionS *exp;
9408
9409 if (*pstr != '{')
9410 return 0;
9411
9412 pstr++;
9413 match_found = 0;
9414 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
9415 {
9416 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
9417 {
9418 if (!i.rounding)
9419 {
9420 rc_op.type = RC_NamesTable[j].type;
9421 rc_op.operand = this_operand;
9422 i.rounding = &rc_op;
9423 }
9424 else
9425 {
9426 as_bad (_("duplicated `%s'"), imm_start);
9427 return 0;
9428 }
9429 pstr += RC_NamesTable[j].len;
9430 match_found = 1;
9431 break;
9432 }
9433 }
9434 if (!match_found)
9435 return 0;
9436
9437 if (*pstr++ != '}')
9438 {
9439 as_bad (_("Missing '}': '%s'"), imm_start);
9440 return 0;
9441 }
9442 /* RC/SAE immediate string should contain nothing more. */;
9443 if (*pstr != 0)
9444 {
9445 as_bad (_("Junk after '}': '%s'"), imm_start);
9446 return 0;
9447 }
9448
9449 exp = &im_expressions[i.imm_operands++];
9450 i.op[this_operand].imms = exp;
9451
9452 exp->X_op = O_constant;
9453 exp->X_add_number = 0;
9454 exp->X_add_symbol = (symbolS *) 0;
9455 exp->X_op_symbol = (symbolS *) 0;
9456
9457 i.types[this_operand].bitfield.imm8 = 1;
9458 return 1;
9459 }
9460
9461 /* Only string instructions can have a second memory operand, so
9462 reduce current_templates to just those if it contains any. */
9463 static int
9464 maybe_adjust_templates (void)
9465 {
9466 const insn_template *t;
9467
9468 gas_assert (i.mem_operands == 1);
9469
9470 for (t = current_templates->start; t < current_templates->end; ++t)
9471 if (t->opcode_modifier.isstring)
9472 break;
9473
9474 if (t < current_templates->end)
9475 {
9476 static templates aux_templates;
9477 bfd_boolean recheck;
9478
9479 aux_templates.start = t;
9480 for (; t < current_templates->end; ++t)
9481 if (!t->opcode_modifier.isstring)
9482 break;
9483 aux_templates.end = t;
9484
9485 /* Determine whether to re-check the first memory operand. */
9486 recheck = (aux_templates.start != current_templates->start
9487 || t != current_templates->end);
9488
9489 current_templates = &aux_templates;
9490
9491 if (recheck)
9492 {
9493 i.mem_operands = 0;
9494 if (i.memop1_string != NULL
9495 && i386_index_check (i.memop1_string) == 0)
9496 return 0;
9497 i.mem_operands = 1;
9498 }
9499 }
9500
9501 return 1;
9502 }
9503
9504 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
9505 on error. */
9506
9507 static int
9508 i386_att_operand (char *operand_string)
9509 {
9510 const reg_entry *r;
9511 char *end_op;
9512 char *op_string = operand_string;
9513
9514 if (is_space_char (*op_string))
9515 ++op_string;
9516
9517 /* We check for an absolute prefix (differentiating,
9518 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
9519 if (*op_string == ABSOLUTE_PREFIX)
9520 {
9521 ++op_string;
9522 if (is_space_char (*op_string))
9523 ++op_string;
9524 i.types[this_operand].bitfield.jumpabsolute = 1;
9525 }
9526
9527 /* Check if operand is a register. */
9528 if ((r = parse_register (op_string, &end_op)) != NULL)
9529 {
9530 i386_operand_type temp;
9531
9532 /* Check for a segment override by searching for ':' after a
9533 segment register. */
9534 op_string = end_op;
9535 if (is_space_char (*op_string))
9536 ++op_string;
9537 if (*op_string == ':'
9538 && (r->reg_type.bitfield.sreg2
9539 || r->reg_type.bitfield.sreg3))
9540 {
9541 switch (r->reg_num)
9542 {
9543 case 0:
9544 i.seg[i.mem_operands] = &es;
9545 break;
9546 case 1:
9547 i.seg[i.mem_operands] = &cs;
9548 break;
9549 case 2:
9550 i.seg[i.mem_operands] = &ss;
9551 break;
9552 case 3:
9553 i.seg[i.mem_operands] = &ds;
9554 break;
9555 case 4:
9556 i.seg[i.mem_operands] = &fs;
9557 break;
9558 case 5:
9559 i.seg[i.mem_operands] = &gs;
9560 break;
9561 }
9562
9563 /* Skip the ':' and whitespace. */
9564 ++op_string;
9565 if (is_space_char (*op_string))
9566 ++op_string;
9567
9568 if (!is_digit_char (*op_string)
9569 && !is_identifier_char (*op_string)
9570 && *op_string != '('
9571 && *op_string != ABSOLUTE_PREFIX)
9572 {
9573 as_bad (_("bad memory operand `%s'"), op_string);
9574 return 0;
9575 }
9576 /* Handle case of %es:*foo. */
9577 if (*op_string == ABSOLUTE_PREFIX)
9578 {
9579 ++op_string;
9580 if (is_space_char (*op_string))
9581 ++op_string;
9582 i.types[this_operand].bitfield.jumpabsolute = 1;
9583 }
9584 goto do_memory_reference;
9585 }
9586
9587 /* Handle vector operations. */
9588 if (*op_string == '{')
9589 {
9590 op_string = check_VecOperations (op_string, NULL);
9591 if (op_string == NULL)
9592 return 0;
9593 }
9594
9595 if (*op_string)
9596 {
9597 as_bad (_("junk `%s' after register"), op_string);
9598 return 0;
9599 }
9600 temp = r->reg_type;
9601 temp.bitfield.baseindex = 0;
9602 i.types[this_operand] = operand_type_or (i.types[this_operand],
9603 temp);
9604 i.types[this_operand].bitfield.unspecified = 0;
9605 i.op[this_operand].regs = r;
9606 i.reg_operands++;
9607 }
9608 else if (*op_string == REGISTER_PREFIX)
9609 {
9610 as_bad (_("bad register name `%s'"), op_string);
9611 return 0;
9612 }
9613 else if (*op_string == IMMEDIATE_PREFIX)
9614 {
9615 ++op_string;
9616 if (i.types[this_operand].bitfield.jumpabsolute)
9617 {
9618 as_bad (_("immediate operand illegal with absolute jump"));
9619 return 0;
9620 }
9621 if (!i386_immediate (op_string))
9622 return 0;
9623 }
9624 else if (RC_SAE_immediate (operand_string))
9625 {
9626 /* If it is a RC or SAE immediate, do nothing. */
9627 ;
9628 }
9629 else if (is_digit_char (*op_string)
9630 || is_identifier_char (*op_string)
9631 || *op_string == '"'
9632 || *op_string == '(')
9633 {
9634 /* This is a memory reference of some sort. */
9635 char *base_string;
9636
9637 /* Start and end of displacement string expression (if found). */
9638 char *displacement_string_start;
9639 char *displacement_string_end;
9640 char *vop_start;
9641
9642 do_memory_reference:
9643 if (i.mem_operands == 1 && !maybe_adjust_templates ())
9644 return 0;
9645 if ((i.mem_operands == 1
9646 && !current_templates->start->opcode_modifier.isstring)
9647 || i.mem_operands == 2)
9648 {
9649 as_bad (_("too many memory references for `%s'"),
9650 current_templates->start->name);
9651 return 0;
9652 }
9653
9654 /* Check for base index form. We detect the base index form by
9655 looking for an ')' at the end of the operand, searching
9656 for the '(' matching it, and finding a REGISTER_PREFIX or ','
9657 after the '('. */
9658 base_string = op_string + strlen (op_string);
9659
9660 /* Handle vector operations. */
9661 vop_start = strchr (op_string, '{');
9662 if (vop_start && vop_start < base_string)
9663 {
9664 if (check_VecOperations (vop_start, base_string) == NULL)
9665 return 0;
9666 base_string = vop_start;
9667 }
9668
9669 --base_string;
9670 if (is_space_char (*base_string))
9671 --base_string;
9672
9673 /* If we only have a displacement, set-up for it to be parsed later. */
9674 displacement_string_start = op_string;
9675 displacement_string_end = base_string + 1;
9676
9677 if (*base_string == ')')
9678 {
9679 char *temp_string;
9680 unsigned int parens_balanced = 1;
9681 /* We've already checked that the number of left & right ()'s are
9682 equal, so this loop will not be infinite. */
9683 do
9684 {
9685 base_string--;
9686 if (*base_string == ')')
9687 parens_balanced++;
9688 if (*base_string == '(')
9689 parens_balanced--;
9690 }
9691 while (parens_balanced);
9692
9693 temp_string = base_string;
9694
9695 /* Skip past '(' and whitespace. */
9696 ++base_string;
9697 if (is_space_char (*base_string))
9698 ++base_string;
9699
9700 if (*base_string == ','
9701 || ((i.base_reg = parse_register (base_string, &end_op))
9702 != NULL))
9703 {
9704 displacement_string_end = temp_string;
9705
9706 i.types[this_operand].bitfield.baseindex = 1;
9707
9708 if (i.base_reg)
9709 {
9710 base_string = end_op;
9711 if (is_space_char (*base_string))
9712 ++base_string;
9713 }
9714
9715 /* There may be an index reg or scale factor here. */
9716 if (*base_string == ',')
9717 {
9718 ++base_string;
9719 if (is_space_char (*base_string))
9720 ++base_string;
9721
9722 if ((i.index_reg = parse_register (base_string, &end_op))
9723 != NULL)
9724 {
9725 base_string = end_op;
9726 if (is_space_char (*base_string))
9727 ++base_string;
9728 if (*base_string == ',')
9729 {
9730 ++base_string;
9731 if (is_space_char (*base_string))
9732 ++base_string;
9733 }
9734 else if (*base_string != ')')
9735 {
9736 as_bad (_("expecting `,' or `)' "
9737 "after index register in `%s'"),
9738 operand_string);
9739 return 0;
9740 }
9741 }
9742 else if (*base_string == REGISTER_PREFIX)
9743 {
9744 end_op = strchr (base_string, ',');
9745 if (end_op)
9746 *end_op = '\0';
9747 as_bad (_("bad register name `%s'"), base_string);
9748 return 0;
9749 }
9750
9751 /* Check for scale factor. */
9752 if (*base_string != ')')
9753 {
9754 char *end_scale = i386_scale (base_string);
9755
9756 if (!end_scale)
9757 return 0;
9758
9759 base_string = end_scale;
9760 if (is_space_char (*base_string))
9761 ++base_string;
9762 if (*base_string != ')')
9763 {
9764 as_bad (_("expecting `)' "
9765 "after scale factor in `%s'"),
9766 operand_string);
9767 return 0;
9768 }
9769 }
9770 else if (!i.index_reg)
9771 {
9772 as_bad (_("expecting index register or scale factor "
9773 "after `,'; got '%c'"),
9774 *base_string);
9775 return 0;
9776 }
9777 }
9778 else if (*base_string != ')')
9779 {
9780 as_bad (_("expecting `,' or `)' "
9781 "after base register in `%s'"),
9782 operand_string);
9783 return 0;
9784 }
9785 }
9786 else if (*base_string == REGISTER_PREFIX)
9787 {
9788 end_op = strchr (base_string, ',');
9789 if (end_op)
9790 *end_op = '\0';
9791 as_bad (_("bad register name `%s'"), base_string);
9792 return 0;
9793 }
9794 }
9795
9796 /* If there's an expression beginning the operand, parse it,
9797 assuming displacement_string_start and
9798 displacement_string_end are meaningful. */
9799 if (displacement_string_start != displacement_string_end)
9800 {
9801 if (!i386_displacement (displacement_string_start,
9802 displacement_string_end))
9803 return 0;
9804 }
9805
9806 /* Special case for (%dx) while doing input/output op. */
9807 if (i.base_reg
9808 && i.base_reg->reg_type.bitfield.inoutportreg
9809 && i.index_reg == 0
9810 && i.log2_scale_factor == 0
9811 && i.seg[i.mem_operands] == 0
9812 && !operand_type_check (i.types[this_operand], disp))
9813 {
9814 i.types[this_operand] = i.base_reg->reg_type;
9815 return 1;
9816 }
9817
9818 if (i386_index_check (operand_string) == 0)
9819 return 0;
9820 i.flags[this_operand] |= Operand_Mem;
9821 if (i.mem_operands == 0)
9822 i.memop1_string = xstrdup (operand_string);
9823 i.mem_operands++;
9824 }
9825 else
9826 {
9827 /* It's not a memory operand; argh! */
9828 as_bad (_("invalid char %s beginning operand %d `%s'"),
9829 output_invalid (*op_string),
9830 this_operand + 1,
9831 op_string);
9832 return 0;
9833 }
9834 return 1; /* Normal return. */
9835 }
9836 \f
9837 /* Calculate the maximum variable size (i.e., excluding fr_fix)
9838 that an rs_machine_dependent frag may reach. */
9839
9840 unsigned int
9841 i386_frag_max_var (fragS *frag)
9842 {
9843 /* The only relaxable frags are for jumps.
9844 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
9845 gas_assert (frag->fr_type == rs_machine_dependent);
9846 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
9847 }
9848
9849 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9850 static int
9851 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
9852 {
9853 /* STT_GNU_IFUNC symbol must go through PLT. */
9854 if ((symbol_get_bfdsym (fr_symbol)->flags
9855 & BSF_GNU_INDIRECT_FUNCTION) != 0)
9856 return 0;
9857
9858 if (!S_IS_EXTERNAL (fr_symbol))
9859 /* Symbol may be weak or local. */
9860 return !S_IS_WEAK (fr_symbol);
9861
9862 /* Global symbols with non-default visibility can't be preempted. */
9863 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
9864 return 1;
9865
9866 if (fr_var != NO_RELOC)
9867 switch ((enum bfd_reloc_code_real) fr_var)
9868 {
9869 case BFD_RELOC_386_PLT32:
9870 case BFD_RELOC_X86_64_PLT32:
9871 /* Symbol with PLT relocation may be preempted. */
9872 return 0;
9873 default:
9874 abort ();
9875 }
9876
9877 /* Global symbols with default visibility in a shared library may be
9878 preempted by another definition. */
9879 return !shared;
9880 }
9881 #endif
9882
9883 /* md_estimate_size_before_relax()
9884
9885 Called just before relax() for rs_machine_dependent frags. The x86
9886 assembler uses these frags to handle variable size jump
9887 instructions.
9888
9889 Any symbol that is now undefined will not become defined.
9890 Return the correct fr_subtype in the frag.
9891 Return the initial "guess for variable size of frag" to caller.
9892 The guess is actually the growth beyond the fixed part. Whatever
9893 we do to grow the fixed or variable part contributes to our
9894 returned value. */
9895
9896 int
9897 md_estimate_size_before_relax (fragS *fragP, segT segment)
9898 {
9899 /* We've already got fragP->fr_subtype right; all we have to do is
9900 check for un-relaxable symbols. On an ELF system, we can't relax
9901 an externally visible symbol, because it may be overridden by a
9902 shared library. */
9903 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
9904 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9905 || (IS_ELF
9906 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
9907 fragP->fr_var))
9908 #endif
9909 #if defined (OBJ_COFF) && defined (TE_PE)
9910 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
9911 && S_IS_WEAK (fragP->fr_symbol))
9912 #endif
9913 )
9914 {
9915 /* Symbol is undefined in this segment, or we need to keep a
9916 reloc so that weak symbols can be overridden. */
9917 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
9918 enum bfd_reloc_code_real reloc_type;
9919 unsigned char *opcode;
9920 int old_fr_fix;
9921
9922 if (fragP->fr_var != NO_RELOC)
9923 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
9924 else if (size == 2)
9925 reloc_type = BFD_RELOC_16_PCREL;
9926 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9927 else if (need_plt32_p (fragP->fr_symbol))
9928 reloc_type = BFD_RELOC_X86_64_PLT32;
9929 #endif
9930 else
9931 reloc_type = BFD_RELOC_32_PCREL;
9932
9933 old_fr_fix = fragP->fr_fix;
9934 opcode = (unsigned char *) fragP->fr_opcode;
9935
9936 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
9937 {
9938 case UNCOND_JUMP:
9939 /* Make jmp (0xeb) a (d)word displacement jump. */
9940 opcode[0] = 0xe9;
9941 fragP->fr_fix += size;
9942 fix_new (fragP, old_fr_fix, size,
9943 fragP->fr_symbol,
9944 fragP->fr_offset, 1,
9945 reloc_type);
9946 break;
9947
9948 case COND_JUMP86:
9949 if (size == 2
9950 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
9951 {
9952 /* Negate the condition, and branch past an
9953 unconditional jump. */
9954 opcode[0] ^= 1;
9955 opcode[1] = 3;
9956 /* Insert an unconditional jump. */
9957 opcode[2] = 0xe9;
9958 /* We added two extra opcode bytes, and have a two byte
9959 offset. */
9960 fragP->fr_fix += 2 + 2;
9961 fix_new (fragP, old_fr_fix + 2, 2,
9962 fragP->fr_symbol,
9963 fragP->fr_offset, 1,
9964 reloc_type);
9965 break;
9966 }
9967 /* Fall through. */
9968
9969 case COND_JUMP:
9970 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
9971 {
9972 fixS *fixP;
9973
9974 fragP->fr_fix += 1;
9975 fixP = fix_new (fragP, old_fr_fix, 1,
9976 fragP->fr_symbol,
9977 fragP->fr_offset, 1,
9978 BFD_RELOC_8_PCREL);
9979 fixP->fx_signed = 1;
9980 break;
9981 }
9982
9983 /* This changes the byte-displacement jump 0x7N
9984 to the (d)word-displacement jump 0x0f,0x8N. */
9985 opcode[1] = opcode[0] + 0x10;
9986 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9987 /* We've added an opcode byte. */
9988 fragP->fr_fix += 1 + size;
9989 fix_new (fragP, old_fr_fix + 1, size,
9990 fragP->fr_symbol,
9991 fragP->fr_offset, 1,
9992 reloc_type);
9993 break;
9994
9995 default:
9996 BAD_CASE (fragP->fr_subtype);
9997 break;
9998 }
9999 frag_wane (fragP);
10000 return fragP->fr_fix - old_fr_fix;
10001 }
10002
10003 /* Guess size depending on current relax state. Initially the relax
10004 state will correspond to a short jump and we return 1, because
10005 the variable part of the frag (the branch offset) is one byte
10006 long. However, we can relax a section more than once and in that
10007 case we must either set fr_subtype back to the unrelaxed state,
10008 or return the value for the appropriate branch. */
10009 return md_relax_table[fragP->fr_subtype].rlx_length;
10010 }
10011
10012 /* Called after relax() is finished.
10013
10014 In: Address of frag.
10015 fr_type == rs_machine_dependent.
10016 fr_subtype is what the address relaxed to.
10017
10018 Out: Any fixSs and constants are set up.
10019 Caller will turn frag into a ".space 0". */
10020
10021 void
10022 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
10023 fragS *fragP)
10024 {
10025 unsigned char *opcode;
10026 unsigned char *where_to_put_displacement = NULL;
10027 offsetT target_address;
10028 offsetT opcode_address;
10029 unsigned int extension = 0;
10030 offsetT displacement_from_opcode_start;
10031
10032 opcode = (unsigned char *) fragP->fr_opcode;
10033
10034 /* Address we want to reach in file space. */
10035 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
10036
10037 /* Address opcode resides at in file space. */
10038 opcode_address = fragP->fr_address + fragP->fr_fix;
10039
10040 /* Displacement from opcode start to fill into instruction. */
10041 displacement_from_opcode_start = target_address - opcode_address;
10042
10043 if ((fragP->fr_subtype & BIG) == 0)
10044 {
10045 /* Don't have to change opcode. */
10046 extension = 1; /* 1 opcode + 1 displacement */
10047 where_to_put_displacement = &opcode[1];
10048 }
10049 else
10050 {
10051 if (no_cond_jump_promotion
10052 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
10053 as_warn_where (fragP->fr_file, fragP->fr_line,
10054 _("long jump required"));
10055
10056 switch (fragP->fr_subtype)
10057 {
10058 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
10059 extension = 4; /* 1 opcode + 4 displacement */
10060 opcode[0] = 0xe9;
10061 where_to_put_displacement = &opcode[1];
10062 break;
10063
10064 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
10065 extension = 2; /* 1 opcode + 2 displacement */
10066 opcode[0] = 0xe9;
10067 where_to_put_displacement = &opcode[1];
10068 break;
10069
10070 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
10071 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
10072 extension = 5; /* 2 opcode + 4 displacement */
10073 opcode[1] = opcode[0] + 0x10;
10074 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10075 where_to_put_displacement = &opcode[2];
10076 break;
10077
10078 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
10079 extension = 3; /* 2 opcode + 2 displacement */
10080 opcode[1] = opcode[0] + 0x10;
10081 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
10082 where_to_put_displacement = &opcode[2];
10083 break;
10084
10085 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
10086 extension = 4;
10087 opcode[0] ^= 1;
10088 opcode[1] = 3;
10089 opcode[2] = 0xe9;
10090 where_to_put_displacement = &opcode[3];
10091 break;
10092
10093 default:
10094 BAD_CASE (fragP->fr_subtype);
10095 break;
10096 }
10097 }
10098
10099 /* If size if less then four we are sure that the operand fits,
10100 but if it's 4, then it could be that the displacement is larger
10101 then -/+ 2GB. */
10102 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
10103 && object_64bit
10104 && ((addressT) (displacement_from_opcode_start - extension
10105 + ((addressT) 1 << 31))
10106 > (((addressT) 2 << 31) - 1)))
10107 {
10108 as_bad_where (fragP->fr_file, fragP->fr_line,
10109 _("jump target out of range"));
10110 /* Make us emit 0. */
10111 displacement_from_opcode_start = extension;
10112 }
10113 /* Now put displacement after opcode. */
10114 md_number_to_chars ((char *) where_to_put_displacement,
10115 (valueT) (displacement_from_opcode_start - extension),
10116 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
10117 fragP->fr_fix += extension;
10118 }
10119 \f
10120 /* Apply a fixup (fixP) to segment data, once it has been determined
10121 by our caller that we have all the info we need to fix it up.
10122
10123 Parameter valP is the pointer to the value of the bits.
10124
10125 On the 386, immediates, displacements, and data pointers are all in
10126 the same (little-endian) format, so we don't need to care about which
10127 we are handling. */
10128
10129 void
10130 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
10131 {
10132 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
10133 valueT value = *valP;
10134
10135 #if !defined (TE_Mach)
10136 if (fixP->fx_pcrel)
10137 {
10138 switch (fixP->fx_r_type)
10139 {
10140 default:
10141 break;
10142
10143 case BFD_RELOC_64:
10144 fixP->fx_r_type = BFD_RELOC_64_PCREL;
10145 break;
10146 case BFD_RELOC_32:
10147 case BFD_RELOC_X86_64_32S:
10148 fixP->fx_r_type = BFD_RELOC_32_PCREL;
10149 break;
10150 case BFD_RELOC_16:
10151 fixP->fx_r_type = BFD_RELOC_16_PCREL;
10152 break;
10153 case BFD_RELOC_8:
10154 fixP->fx_r_type = BFD_RELOC_8_PCREL;
10155 break;
10156 }
10157 }
10158
10159 if (fixP->fx_addsy != NULL
10160 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
10161 || fixP->fx_r_type == BFD_RELOC_64_PCREL
10162 || fixP->fx_r_type == BFD_RELOC_16_PCREL
10163 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
10164 && !use_rela_relocations)
10165 {
10166 /* This is a hack. There should be a better way to handle this.
10167 This covers for the fact that bfd_install_relocation will
10168 subtract the current location (for partial_inplace, PC relative
10169 relocations); see more below. */
10170 #ifndef OBJ_AOUT
10171 if (IS_ELF
10172 #ifdef TE_PE
10173 || OUTPUT_FLAVOR == bfd_target_coff_flavour
10174 #endif
10175 )
10176 value += fixP->fx_where + fixP->fx_frag->fr_address;
10177 #endif
10178 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10179 if (IS_ELF)
10180 {
10181 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
10182
10183 if ((sym_seg == seg
10184 || (symbol_section_p (fixP->fx_addsy)
10185 && sym_seg != absolute_section))
10186 && !generic_force_reloc (fixP))
10187 {
10188 /* Yes, we add the values in twice. This is because
10189 bfd_install_relocation subtracts them out again. I think
10190 bfd_install_relocation is broken, but I don't dare change
10191 it. FIXME. */
10192 value += fixP->fx_where + fixP->fx_frag->fr_address;
10193 }
10194 }
10195 #endif
10196 #if defined (OBJ_COFF) && defined (TE_PE)
10197 /* For some reason, the PE format does not store a
10198 section address offset for a PC relative symbol. */
10199 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
10200 || S_IS_WEAK (fixP->fx_addsy))
10201 value += md_pcrel_from (fixP);
10202 #endif
10203 }
10204 #if defined (OBJ_COFF) && defined (TE_PE)
10205 if (fixP->fx_addsy != NULL
10206 && S_IS_WEAK (fixP->fx_addsy)
10207 /* PR 16858: Do not modify weak function references. */
10208 && ! fixP->fx_pcrel)
10209 {
10210 #if !defined (TE_PEP)
10211 /* For x86 PE weak function symbols are neither PC-relative
10212 nor do they set S_IS_FUNCTION. So the only reliable way
10213 to detect them is to check the flags of their containing
10214 section. */
10215 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
10216 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
10217 ;
10218 else
10219 #endif
10220 value -= S_GET_VALUE (fixP->fx_addsy);
10221 }
10222 #endif
10223
10224 /* Fix a few things - the dynamic linker expects certain values here,
10225 and we must not disappoint it. */
10226 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10227 if (IS_ELF && fixP->fx_addsy)
10228 switch (fixP->fx_r_type)
10229 {
10230 case BFD_RELOC_386_PLT32:
10231 case BFD_RELOC_X86_64_PLT32:
10232 /* Make the jump instruction point to the address of the operand. At
10233 runtime we merely add the offset to the actual PLT entry. */
10234 value = -4;
10235 break;
10236
10237 case BFD_RELOC_386_TLS_GD:
10238 case BFD_RELOC_386_TLS_LDM:
10239 case BFD_RELOC_386_TLS_IE_32:
10240 case BFD_RELOC_386_TLS_IE:
10241 case BFD_RELOC_386_TLS_GOTIE:
10242 case BFD_RELOC_386_TLS_GOTDESC:
10243 case BFD_RELOC_X86_64_TLSGD:
10244 case BFD_RELOC_X86_64_TLSLD:
10245 case BFD_RELOC_X86_64_GOTTPOFF:
10246 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10247 value = 0; /* Fully resolved at runtime. No addend. */
10248 /* Fallthrough */
10249 case BFD_RELOC_386_TLS_LE:
10250 case BFD_RELOC_386_TLS_LDO_32:
10251 case BFD_RELOC_386_TLS_LE_32:
10252 case BFD_RELOC_X86_64_DTPOFF32:
10253 case BFD_RELOC_X86_64_DTPOFF64:
10254 case BFD_RELOC_X86_64_TPOFF32:
10255 case BFD_RELOC_X86_64_TPOFF64:
10256 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10257 break;
10258
10259 case BFD_RELOC_386_TLS_DESC_CALL:
10260 case BFD_RELOC_X86_64_TLSDESC_CALL:
10261 value = 0; /* Fully resolved at runtime. No addend. */
10262 S_SET_THREAD_LOCAL (fixP->fx_addsy);
10263 fixP->fx_done = 0;
10264 return;
10265
10266 case BFD_RELOC_VTABLE_INHERIT:
10267 case BFD_RELOC_VTABLE_ENTRY:
10268 fixP->fx_done = 0;
10269 return;
10270
10271 default:
10272 break;
10273 }
10274 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
10275 *valP = value;
10276 #endif /* !defined (TE_Mach) */
10277
10278 /* Are we finished with this relocation now? */
10279 if (fixP->fx_addsy == NULL)
10280 fixP->fx_done = 1;
10281 #if defined (OBJ_COFF) && defined (TE_PE)
10282 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
10283 {
10284 fixP->fx_done = 0;
10285 /* Remember value for tc_gen_reloc. */
10286 fixP->fx_addnumber = value;
10287 /* Clear out the frag for now. */
10288 value = 0;
10289 }
10290 #endif
10291 else if (use_rela_relocations)
10292 {
10293 fixP->fx_no_overflow = 1;
10294 /* Remember value for tc_gen_reloc. */
10295 fixP->fx_addnumber = value;
10296 value = 0;
10297 }
10298
10299 md_number_to_chars (p, value, fixP->fx_size);
10300 }
10301 \f
10302 const char *
10303 md_atof (int type, char *litP, int *sizeP)
10304 {
10305 /* This outputs the LITTLENUMs in REVERSE order;
10306 in accord with the bigendian 386. */
10307 return ieee_md_atof (type, litP, sizeP, FALSE);
10308 }
10309 \f
10310 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
10311
10312 static char *
10313 output_invalid (int c)
10314 {
10315 if (ISPRINT (c))
10316 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
10317 "'%c'", c);
10318 else
10319 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
10320 "(0x%x)", (unsigned char) c);
10321 return output_invalid_buf;
10322 }
10323
10324 /* REG_STRING starts *before* REGISTER_PREFIX. */
10325
10326 static const reg_entry *
10327 parse_real_register (char *reg_string, char **end_op)
10328 {
10329 char *s = reg_string;
10330 char *p;
10331 char reg_name_given[MAX_REG_NAME_SIZE + 1];
10332 const reg_entry *r;
10333
10334 /* Skip possible REGISTER_PREFIX and possible whitespace. */
10335 if (*s == REGISTER_PREFIX)
10336 ++s;
10337
10338 if (is_space_char (*s))
10339 ++s;
10340
10341 p = reg_name_given;
10342 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
10343 {
10344 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
10345 return (const reg_entry *) NULL;
10346 s++;
10347 }
10348
10349 /* For naked regs, make sure that we are not dealing with an identifier.
10350 This prevents confusing an identifier like `eax_var' with register
10351 `eax'. */
10352 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
10353 return (const reg_entry *) NULL;
10354
10355 *end_op = s;
10356
10357 r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
10358
10359 /* Handle floating point regs, allowing spaces in the (i) part. */
10360 if (r == i386_regtab /* %st is first entry of table */)
10361 {
10362 if (!cpu_arch_flags.bitfield.cpu8087
10363 && !cpu_arch_flags.bitfield.cpu287
10364 && !cpu_arch_flags.bitfield.cpu387)
10365 return (const reg_entry *) NULL;
10366
10367 if (is_space_char (*s))
10368 ++s;
10369 if (*s == '(')
10370 {
10371 ++s;
10372 if (is_space_char (*s))
10373 ++s;
10374 if (*s >= '0' && *s <= '7')
10375 {
10376 int fpr = *s - '0';
10377 ++s;
10378 if (is_space_char (*s))
10379 ++s;
10380 if (*s == ')')
10381 {
10382 *end_op = s + 1;
10383 r = (const reg_entry *) hash_find (reg_hash, "st(0)");
10384 know (r);
10385 return r + fpr;
10386 }
10387 }
10388 /* We have "%st(" then garbage. */
10389 return (const reg_entry *) NULL;
10390 }
10391 }
10392
10393 if (r == NULL || allow_pseudo_reg)
10394 return r;
10395
10396 if (operand_type_all_zero (&r->reg_type))
10397 return (const reg_entry *) NULL;
10398
10399 if ((r->reg_type.bitfield.dword
10400 || r->reg_type.bitfield.sreg3
10401 || r->reg_type.bitfield.control
10402 || r->reg_type.bitfield.debug
10403 || r->reg_type.bitfield.test)
10404 && !cpu_arch_flags.bitfield.cpui386)
10405 return (const reg_entry *) NULL;
10406
10407 if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
10408 return (const reg_entry *) NULL;
10409
10410 if (!cpu_arch_flags.bitfield.cpuavx512f)
10411 {
10412 if (r->reg_type.bitfield.zmmword || r->reg_type.bitfield.regmask)
10413 return (const reg_entry *) NULL;
10414
10415 if (!cpu_arch_flags.bitfield.cpuavx)
10416 {
10417 if (r->reg_type.bitfield.ymmword)
10418 return (const reg_entry *) NULL;
10419
10420 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
10421 return (const reg_entry *) NULL;
10422 }
10423 }
10424
10425 if (r->reg_type.bitfield.regbnd && !cpu_arch_flags.bitfield.cpumpx)
10426 return (const reg_entry *) NULL;
10427
10428 /* Don't allow fake index register unless allow_index_reg isn't 0. */
10429 if (!allow_index_reg && r->reg_num == RegIZ)
10430 return (const reg_entry *) NULL;
10431
10432 /* Upper 16 vector registers are only available with VREX in 64bit
10433 mode, and require EVEX encoding. */
10434 if (r->reg_flags & RegVRex)
10435 {
10436 if (!cpu_arch_flags.bitfield.cpuavx512f
10437 || flag_code != CODE_64BIT)
10438 return (const reg_entry *) NULL;
10439
10440 i.vec_encoding = vex_encoding_evex;
10441 }
10442
10443 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
10444 && (!cpu_arch_flags.bitfield.cpulm || !r->reg_type.bitfield.control)
10445 && flag_code != CODE_64BIT)
10446 return (const reg_entry *) NULL;
10447
10448 if (r->reg_type.bitfield.sreg3 && r->reg_num == RegFlat && !intel_syntax)
10449 return (const reg_entry *) NULL;
10450
10451 return r;
10452 }
10453
10454 /* REG_STRING starts *before* REGISTER_PREFIX. */
10455
10456 static const reg_entry *
10457 parse_register (char *reg_string, char **end_op)
10458 {
10459 const reg_entry *r;
10460
10461 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
10462 r = parse_real_register (reg_string, end_op);
10463 else
10464 r = NULL;
10465 if (!r)
10466 {
10467 char *save = input_line_pointer;
10468 char c;
10469 symbolS *symbolP;
10470
10471 input_line_pointer = reg_string;
10472 c = get_symbol_name (&reg_string);
10473 symbolP = symbol_find (reg_string);
10474 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
10475 {
10476 const expressionS *e = symbol_get_value_expression (symbolP);
10477
10478 know (e->X_op == O_register);
10479 know (e->X_add_number >= 0
10480 && (valueT) e->X_add_number < i386_regtab_size);
10481 r = i386_regtab + e->X_add_number;
10482 if ((r->reg_flags & RegVRex))
10483 i.vec_encoding = vex_encoding_evex;
10484 *end_op = input_line_pointer;
10485 }
10486 *input_line_pointer = c;
10487 input_line_pointer = save;
10488 }
10489 return r;
10490 }
10491
10492 int
10493 i386_parse_name (char *name, expressionS *e, char *nextcharP)
10494 {
10495 const reg_entry *r;
10496 char *end = input_line_pointer;
10497
10498 *end = *nextcharP;
10499 r = parse_register (name, &input_line_pointer);
10500 if (r && end <= input_line_pointer)
10501 {
10502 *nextcharP = *input_line_pointer;
10503 *input_line_pointer = 0;
10504 e->X_op = O_register;
10505 e->X_add_number = r - i386_regtab;
10506 return 1;
10507 }
10508 input_line_pointer = end;
10509 *end = 0;
10510 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
10511 }
10512
10513 void
10514 md_operand (expressionS *e)
10515 {
10516 char *end;
10517 const reg_entry *r;
10518
10519 switch (*input_line_pointer)
10520 {
10521 case REGISTER_PREFIX:
10522 r = parse_real_register (input_line_pointer, &end);
10523 if (r)
10524 {
10525 e->X_op = O_register;
10526 e->X_add_number = r - i386_regtab;
10527 input_line_pointer = end;
10528 }
10529 break;
10530
10531 case '[':
10532 gas_assert (intel_syntax);
10533 end = input_line_pointer++;
10534 expression (e);
10535 if (*input_line_pointer == ']')
10536 {
10537 ++input_line_pointer;
10538 e->X_op_symbol = make_expr_symbol (e);
10539 e->X_add_symbol = NULL;
10540 e->X_add_number = 0;
10541 e->X_op = O_index;
10542 }
10543 else
10544 {
10545 e->X_op = O_absent;
10546 input_line_pointer = end;
10547 }
10548 break;
10549 }
10550 }
10551
10552 \f
10553 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10554 const char *md_shortopts = "kVQ:sqnO::";
10555 #else
10556 const char *md_shortopts = "qnO::";
10557 #endif
10558
10559 #define OPTION_32 (OPTION_MD_BASE + 0)
10560 #define OPTION_64 (OPTION_MD_BASE + 1)
10561 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
10562 #define OPTION_MARCH (OPTION_MD_BASE + 3)
10563 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
10564 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
10565 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
10566 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
10567 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
10568 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
10569 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
10570 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
10571 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
10572 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
10573 #define OPTION_X32 (OPTION_MD_BASE + 14)
10574 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
10575 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
10576 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
10577 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
10578 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
10579 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
10580 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
10581 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
10582 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
10583 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
10584
10585 struct option md_longopts[] =
10586 {
10587 {"32", no_argument, NULL, OPTION_32},
10588 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10589 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
10590 {"64", no_argument, NULL, OPTION_64},
10591 #endif
10592 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10593 {"x32", no_argument, NULL, OPTION_X32},
10594 {"mshared", no_argument, NULL, OPTION_MSHARED},
10595 #endif
10596 {"divide", no_argument, NULL, OPTION_DIVIDE},
10597 {"march", required_argument, NULL, OPTION_MARCH},
10598 {"mtune", required_argument, NULL, OPTION_MTUNE},
10599 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
10600 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
10601 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
10602 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
10603 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
10604 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
10605 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
10606 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
10607 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
10608 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
10609 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
10610 # if defined (TE_PE) || defined (TE_PEP)
10611 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
10612 #endif
10613 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
10614 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
10615 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
10616 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
10617 {"mamd64", no_argument, NULL, OPTION_MAMD64},
10618 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
10619 {NULL, no_argument, NULL, 0}
10620 };
10621 size_t md_longopts_size = sizeof (md_longopts);
10622
10623 int
10624 md_parse_option (int c, const char *arg)
10625 {
10626 unsigned int j;
10627 char *arch, *next, *saved;
10628
10629 switch (c)
10630 {
10631 case 'n':
10632 optimize_align_code = 0;
10633 break;
10634
10635 case 'q':
10636 quiet_warnings = 1;
10637 break;
10638
10639 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10640 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
10641 should be emitted or not. FIXME: Not implemented. */
10642 case 'Q':
10643 break;
10644
10645 /* -V: SVR4 argument to print version ID. */
10646 case 'V':
10647 print_version_id ();
10648 break;
10649
10650 /* -k: Ignore for FreeBSD compatibility. */
10651 case 'k':
10652 break;
10653
10654 case 's':
10655 /* -s: On i386 Solaris, this tells the native assembler to use
10656 .stab instead of .stab.excl. We always use .stab anyhow. */
10657 break;
10658
10659 case OPTION_MSHARED:
10660 shared = 1;
10661 break;
10662 #endif
10663 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10664 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
10665 case OPTION_64:
10666 {
10667 const char **list, **l;
10668
10669 list = bfd_target_list ();
10670 for (l = list; *l != NULL; l++)
10671 if (CONST_STRNEQ (*l, "elf64-x86-64")
10672 || strcmp (*l, "coff-x86-64") == 0
10673 || strcmp (*l, "pe-x86-64") == 0
10674 || strcmp (*l, "pei-x86-64") == 0
10675 || strcmp (*l, "mach-o-x86-64") == 0)
10676 {
10677 default_arch = "x86_64";
10678 break;
10679 }
10680 if (*l == NULL)
10681 as_fatal (_("no compiled in support for x86_64"));
10682 free (list);
10683 }
10684 break;
10685 #endif
10686
10687 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10688 case OPTION_X32:
10689 if (IS_ELF)
10690 {
10691 const char **list, **l;
10692
10693 list = bfd_target_list ();
10694 for (l = list; *l != NULL; l++)
10695 if (CONST_STRNEQ (*l, "elf32-x86-64"))
10696 {
10697 default_arch = "x86_64:32";
10698 break;
10699 }
10700 if (*l == NULL)
10701 as_fatal (_("no compiled in support for 32bit x86_64"));
10702 free (list);
10703 }
10704 else
10705 as_fatal (_("32bit x86_64 is only supported for ELF"));
10706 break;
10707 #endif
10708
10709 case OPTION_32:
10710 default_arch = "i386";
10711 break;
10712
10713 case OPTION_DIVIDE:
10714 #ifdef SVR4_COMMENT_CHARS
10715 {
10716 char *n, *t;
10717 const char *s;
10718
10719 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
10720 t = n;
10721 for (s = i386_comment_chars; *s != '\0'; s++)
10722 if (*s != '/')
10723 *t++ = *s;
10724 *t = '\0';
10725 i386_comment_chars = n;
10726 }
10727 #endif
10728 break;
10729
10730 case OPTION_MARCH:
10731 saved = xstrdup (arg);
10732 arch = saved;
10733 /* Allow -march=+nosse. */
10734 if (*arch == '+')
10735 arch++;
10736 do
10737 {
10738 if (*arch == '.')
10739 as_fatal (_("invalid -march= option: `%s'"), arg);
10740 next = strchr (arch, '+');
10741 if (next)
10742 *next++ = '\0';
10743 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
10744 {
10745 if (strcmp (arch, cpu_arch [j].name) == 0)
10746 {
10747 /* Processor. */
10748 if (! cpu_arch[j].flags.bitfield.cpui386)
10749 continue;
10750
10751 cpu_arch_name = cpu_arch[j].name;
10752 cpu_sub_arch_name = NULL;
10753 cpu_arch_flags = cpu_arch[j].flags;
10754 cpu_arch_isa = cpu_arch[j].type;
10755 cpu_arch_isa_flags = cpu_arch[j].flags;
10756 if (!cpu_arch_tune_set)
10757 {
10758 cpu_arch_tune = cpu_arch_isa;
10759 cpu_arch_tune_flags = cpu_arch_isa_flags;
10760 }
10761 break;
10762 }
10763 else if (*cpu_arch [j].name == '.'
10764 && strcmp (arch, cpu_arch [j].name + 1) == 0)
10765 {
10766 /* ISA extension. */
10767 i386_cpu_flags flags;
10768
10769 flags = cpu_flags_or (cpu_arch_flags,
10770 cpu_arch[j].flags);
10771
10772 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
10773 {
10774 if (cpu_sub_arch_name)
10775 {
10776 char *name = cpu_sub_arch_name;
10777 cpu_sub_arch_name = concat (name,
10778 cpu_arch[j].name,
10779 (const char *) NULL);
10780 free (name);
10781 }
10782 else
10783 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
10784 cpu_arch_flags = flags;
10785 cpu_arch_isa_flags = flags;
10786 }
10787 else
10788 cpu_arch_isa_flags
10789 = cpu_flags_or (cpu_arch_isa_flags,
10790 cpu_arch[j].flags);
10791 break;
10792 }
10793 }
10794
10795 if (j >= ARRAY_SIZE (cpu_arch))
10796 {
10797 /* Disable an ISA extension. */
10798 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
10799 if (strcmp (arch, cpu_noarch [j].name) == 0)
10800 {
10801 i386_cpu_flags flags;
10802
10803 flags = cpu_flags_and_not (cpu_arch_flags,
10804 cpu_noarch[j].flags);
10805 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
10806 {
10807 if (cpu_sub_arch_name)
10808 {
10809 char *name = cpu_sub_arch_name;
10810 cpu_sub_arch_name = concat (arch,
10811 (const char *) NULL);
10812 free (name);
10813 }
10814 else
10815 cpu_sub_arch_name = xstrdup (arch);
10816 cpu_arch_flags = flags;
10817 cpu_arch_isa_flags = flags;
10818 }
10819 break;
10820 }
10821
10822 if (j >= ARRAY_SIZE (cpu_noarch))
10823 j = ARRAY_SIZE (cpu_arch);
10824 }
10825
10826 if (j >= ARRAY_SIZE (cpu_arch))
10827 as_fatal (_("invalid -march= option: `%s'"), arg);
10828
10829 arch = next;
10830 }
10831 while (next != NULL);
10832 free (saved);
10833 break;
10834
10835 case OPTION_MTUNE:
10836 if (*arg == '.')
10837 as_fatal (_("invalid -mtune= option: `%s'"), arg);
10838 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
10839 {
10840 if (strcmp (arg, cpu_arch [j].name) == 0)
10841 {
10842 cpu_arch_tune_set = 1;
10843 cpu_arch_tune = cpu_arch [j].type;
10844 cpu_arch_tune_flags = cpu_arch[j].flags;
10845 break;
10846 }
10847 }
10848 if (j >= ARRAY_SIZE (cpu_arch))
10849 as_fatal (_("invalid -mtune= option: `%s'"), arg);
10850 break;
10851
10852 case OPTION_MMNEMONIC:
10853 if (strcasecmp (arg, "att") == 0)
10854 intel_mnemonic = 0;
10855 else if (strcasecmp (arg, "intel") == 0)
10856 intel_mnemonic = 1;
10857 else
10858 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
10859 break;
10860
10861 case OPTION_MSYNTAX:
10862 if (strcasecmp (arg, "att") == 0)
10863 intel_syntax = 0;
10864 else if (strcasecmp (arg, "intel") == 0)
10865 intel_syntax = 1;
10866 else
10867 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
10868 break;
10869
10870 case OPTION_MINDEX_REG:
10871 allow_index_reg = 1;
10872 break;
10873
10874 case OPTION_MNAKED_REG:
10875 allow_naked_reg = 1;
10876 break;
10877
10878 case OPTION_MSSE2AVX:
10879 sse2avx = 1;
10880 break;
10881
10882 case OPTION_MSSE_CHECK:
10883 if (strcasecmp (arg, "error") == 0)
10884 sse_check = check_error;
10885 else if (strcasecmp (arg, "warning") == 0)
10886 sse_check = check_warning;
10887 else if (strcasecmp (arg, "none") == 0)
10888 sse_check = check_none;
10889 else
10890 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
10891 break;
10892
10893 case OPTION_MOPERAND_CHECK:
10894 if (strcasecmp (arg, "error") == 0)
10895 operand_check = check_error;
10896 else if (strcasecmp (arg, "warning") == 0)
10897 operand_check = check_warning;
10898 else if (strcasecmp (arg, "none") == 0)
10899 operand_check = check_none;
10900 else
10901 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
10902 break;
10903
10904 case OPTION_MAVXSCALAR:
10905 if (strcasecmp (arg, "128") == 0)
10906 avxscalar = vex128;
10907 else if (strcasecmp (arg, "256") == 0)
10908 avxscalar = vex256;
10909 else
10910 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
10911 break;
10912
10913 case OPTION_MADD_BND_PREFIX:
10914 add_bnd_prefix = 1;
10915 break;
10916
10917 case OPTION_MEVEXLIG:
10918 if (strcmp (arg, "128") == 0)
10919 evexlig = evexl128;
10920 else if (strcmp (arg, "256") == 0)
10921 evexlig = evexl256;
10922 else if (strcmp (arg, "512") == 0)
10923 evexlig = evexl512;
10924 else
10925 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
10926 break;
10927
10928 case OPTION_MEVEXRCIG:
10929 if (strcmp (arg, "rne") == 0)
10930 evexrcig = rne;
10931 else if (strcmp (arg, "rd") == 0)
10932 evexrcig = rd;
10933 else if (strcmp (arg, "ru") == 0)
10934 evexrcig = ru;
10935 else if (strcmp (arg, "rz") == 0)
10936 evexrcig = rz;
10937 else
10938 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
10939 break;
10940
10941 case OPTION_MEVEXWIG:
10942 if (strcmp (arg, "0") == 0)
10943 evexwig = evexw0;
10944 else if (strcmp (arg, "1") == 0)
10945 evexwig = evexw1;
10946 else
10947 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
10948 break;
10949
10950 # if defined (TE_PE) || defined (TE_PEP)
10951 case OPTION_MBIG_OBJ:
10952 use_big_obj = 1;
10953 break;
10954 #endif
10955
10956 case OPTION_MOMIT_LOCK_PREFIX:
10957 if (strcasecmp (arg, "yes") == 0)
10958 omit_lock_prefix = 1;
10959 else if (strcasecmp (arg, "no") == 0)
10960 omit_lock_prefix = 0;
10961 else
10962 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
10963 break;
10964
10965 case OPTION_MFENCE_AS_LOCK_ADD:
10966 if (strcasecmp (arg, "yes") == 0)
10967 avoid_fence = 1;
10968 else if (strcasecmp (arg, "no") == 0)
10969 avoid_fence = 0;
10970 else
10971 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
10972 break;
10973
10974 case OPTION_MRELAX_RELOCATIONS:
10975 if (strcasecmp (arg, "yes") == 0)
10976 generate_relax_relocations = 1;
10977 else if (strcasecmp (arg, "no") == 0)
10978 generate_relax_relocations = 0;
10979 else
10980 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
10981 break;
10982
10983 case OPTION_MAMD64:
10984 intel64 = 0;
10985 break;
10986
10987 case OPTION_MINTEL64:
10988 intel64 = 1;
10989 break;
10990
10991 case 'O':
10992 if (arg == NULL)
10993 {
10994 optimize = 1;
10995 /* Turn off -Os. */
10996 optimize_for_space = 0;
10997 }
10998 else if (*arg == 's')
10999 {
11000 optimize_for_space = 1;
11001 /* Turn on all encoding optimizations. */
11002 optimize = -1;
11003 }
11004 else
11005 {
11006 optimize = atoi (arg);
11007 /* Turn off -Os. */
11008 optimize_for_space = 0;
11009 }
11010 break;
11011
11012 default:
11013 return 0;
11014 }
11015 return 1;
11016 }
11017
11018 #define MESSAGE_TEMPLATE \
11019 " "
11020
11021 static char *
11022 output_message (FILE *stream, char *p, char *message, char *start,
11023 int *left_p, const char *name, int len)
11024 {
11025 int size = sizeof (MESSAGE_TEMPLATE);
11026 int left = *left_p;
11027
11028 /* Reserve 2 spaces for ", " or ",\0" */
11029 left -= len + 2;
11030
11031 /* Check if there is any room. */
11032 if (left >= 0)
11033 {
11034 if (p != start)
11035 {
11036 *p++ = ',';
11037 *p++ = ' ';
11038 }
11039 p = mempcpy (p, name, len);
11040 }
11041 else
11042 {
11043 /* Output the current message now and start a new one. */
11044 *p++ = ',';
11045 *p = '\0';
11046 fprintf (stream, "%s\n", message);
11047 p = start;
11048 left = size - (start - message) - len - 2;
11049
11050 gas_assert (left >= 0);
11051
11052 p = mempcpy (p, name, len);
11053 }
11054
11055 *left_p = left;
11056 return p;
11057 }
11058
11059 static void
11060 show_arch (FILE *stream, int ext, int check)
11061 {
11062 static char message[] = MESSAGE_TEMPLATE;
11063 char *start = message + 27;
11064 char *p;
11065 int size = sizeof (MESSAGE_TEMPLATE);
11066 int left;
11067 const char *name;
11068 int len;
11069 unsigned int j;
11070
11071 p = start;
11072 left = size - (start - message);
11073 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
11074 {
11075 /* Should it be skipped? */
11076 if (cpu_arch [j].skip)
11077 continue;
11078
11079 name = cpu_arch [j].name;
11080 len = cpu_arch [j].len;
11081 if (*name == '.')
11082 {
11083 /* It is an extension. Skip if we aren't asked to show it. */
11084 if (ext)
11085 {
11086 name++;
11087 len--;
11088 }
11089 else
11090 continue;
11091 }
11092 else if (ext)
11093 {
11094 /* It is an processor. Skip if we show only extension. */
11095 continue;
11096 }
11097 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
11098 {
11099 /* It is an impossible processor - skip. */
11100 continue;
11101 }
11102
11103 p = output_message (stream, p, message, start, &left, name, len);
11104 }
11105
11106 /* Display disabled extensions. */
11107 if (ext)
11108 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
11109 {
11110 name = cpu_noarch [j].name;
11111 len = cpu_noarch [j].len;
11112 p = output_message (stream, p, message, start, &left, name,
11113 len);
11114 }
11115
11116 *p = '\0';
11117 fprintf (stream, "%s\n", message);
11118 }
11119
11120 void
11121 md_show_usage (FILE *stream)
11122 {
11123 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11124 fprintf (stream, _("\
11125 -Q ignored\n\
11126 -V print assembler version number\n\
11127 -k ignored\n"));
11128 #endif
11129 fprintf (stream, _("\
11130 -n Do not optimize code alignment\n\
11131 -q quieten some warnings\n"));
11132 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11133 fprintf (stream, _("\
11134 -s ignored\n"));
11135 #endif
11136 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11137 || defined (TE_PE) || defined (TE_PEP))
11138 fprintf (stream, _("\
11139 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
11140 #endif
11141 #ifdef SVR4_COMMENT_CHARS
11142 fprintf (stream, _("\
11143 --divide do not treat `/' as a comment character\n"));
11144 #else
11145 fprintf (stream, _("\
11146 --divide ignored\n"));
11147 #endif
11148 fprintf (stream, _("\
11149 -march=CPU[,+EXTENSION...]\n\
11150 generate code for CPU and EXTENSION, CPU is one of:\n"));
11151 show_arch (stream, 0, 1);
11152 fprintf (stream, _("\
11153 EXTENSION is combination of:\n"));
11154 show_arch (stream, 1, 0);
11155 fprintf (stream, _("\
11156 -mtune=CPU optimize for CPU, CPU is one of:\n"));
11157 show_arch (stream, 0, 0);
11158 fprintf (stream, _("\
11159 -msse2avx encode SSE instructions with VEX prefix\n"));
11160 fprintf (stream, _("\
11161 -msse-check=[none|error|warning] (default: warning)\n\
11162 check SSE instructions\n"));
11163 fprintf (stream, _("\
11164 -moperand-check=[none|error|warning] (default: warning)\n\
11165 check operand combinations for validity\n"));
11166 fprintf (stream, _("\
11167 -mavxscalar=[128|256] (default: 128)\n\
11168 encode scalar AVX instructions with specific vector\n\
11169 length\n"));
11170 fprintf (stream, _("\
11171 -mevexlig=[128|256|512] (default: 128)\n\
11172 encode scalar EVEX instructions with specific vector\n\
11173 length\n"));
11174 fprintf (stream, _("\
11175 -mevexwig=[0|1] (default: 0)\n\
11176 encode EVEX instructions with specific EVEX.W value\n\
11177 for EVEX.W bit ignored instructions\n"));
11178 fprintf (stream, _("\
11179 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
11180 encode EVEX instructions with specific EVEX.RC value\n\
11181 for SAE-only ignored instructions\n"));
11182 fprintf (stream, _("\
11183 -mmnemonic=[att|intel] "));
11184 if (SYSV386_COMPAT)
11185 fprintf (stream, _("(default: att)\n"));
11186 else
11187 fprintf (stream, _("(default: intel)\n"));
11188 fprintf (stream, _("\
11189 use AT&T/Intel mnemonic\n"));
11190 fprintf (stream, _("\
11191 -msyntax=[att|intel] (default: att)\n\
11192 use AT&T/Intel syntax\n"));
11193 fprintf (stream, _("\
11194 -mindex-reg support pseudo index registers\n"));
11195 fprintf (stream, _("\
11196 -mnaked-reg don't require `%%' prefix for registers\n"));
11197 fprintf (stream, _("\
11198 -madd-bnd-prefix add BND prefix for all valid branches\n"));
11199 fprintf (stream, _("\
11200 -mshared disable branch optimization for shared code\n"));
11201 # if defined (TE_PE) || defined (TE_PEP)
11202 fprintf (stream, _("\
11203 -mbig-obj generate big object files\n"));
11204 #endif
11205 fprintf (stream, _("\
11206 -momit-lock-prefix=[no|yes] (default: no)\n\
11207 strip all lock prefixes\n"));
11208 fprintf (stream, _("\
11209 -mfence-as-lock-add=[no|yes] (default: no)\n\
11210 encode lfence, mfence and sfence as\n\
11211 lock addl $0x0, (%%{re}sp)\n"));
11212 fprintf (stream, _("\
11213 -mrelax-relocations=[no|yes] "));
11214 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
11215 fprintf (stream, _("(default: yes)\n"));
11216 else
11217 fprintf (stream, _("(default: no)\n"));
11218 fprintf (stream, _("\
11219 generate relax relocations\n"));
11220 fprintf (stream, _("\
11221 -mamd64 accept only AMD64 ISA [default]\n"));
11222 fprintf (stream, _("\
11223 -mintel64 accept only Intel64 ISA\n"));
11224 }
11225
11226 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
11227 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
11228 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
11229
11230 /* Pick the target format to use. */
11231
11232 const char *
11233 i386_target_format (void)
11234 {
11235 if (!strncmp (default_arch, "x86_64", 6))
11236 {
11237 update_code_flag (CODE_64BIT, 1);
11238 if (default_arch[6] == '\0')
11239 x86_elf_abi = X86_64_ABI;
11240 else
11241 x86_elf_abi = X86_64_X32_ABI;
11242 }
11243 else if (!strcmp (default_arch, "i386"))
11244 update_code_flag (CODE_32BIT, 1);
11245 else if (!strcmp (default_arch, "iamcu"))
11246 {
11247 update_code_flag (CODE_32BIT, 1);
11248 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
11249 {
11250 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
11251 cpu_arch_name = "iamcu";
11252 cpu_sub_arch_name = NULL;
11253 cpu_arch_flags = iamcu_flags;
11254 cpu_arch_isa = PROCESSOR_IAMCU;
11255 cpu_arch_isa_flags = iamcu_flags;
11256 if (!cpu_arch_tune_set)
11257 {
11258 cpu_arch_tune = cpu_arch_isa;
11259 cpu_arch_tune_flags = cpu_arch_isa_flags;
11260 }
11261 }
11262 else if (cpu_arch_isa != PROCESSOR_IAMCU)
11263 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
11264 cpu_arch_name);
11265 }
11266 else
11267 as_fatal (_("unknown architecture"));
11268
11269 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
11270 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11271 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
11272 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
11273
11274 switch (OUTPUT_FLAVOR)
11275 {
11276 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
11277 case bfd_target_aout_flavour:
11278 return AOUT_TARGET_FORMAT;
11279 #endif
11280 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
11281 # if defined (TE_PE) || defined (TE_PEP)
11282 case bfd_target_coff_flavour:
11283 if (flag_code == CODE_64BIT)
11284 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
11285 else
11286 return "pe-i386";
11287 # elif defined (TE_GO32)
11288 case bfd_target_coff_flavour:
11289 return "coff-go32";
11290 # else
11291 case bfd_target_coff_flavour:
11292 return "coff-i386";
11293 # endif
11294 #endif
11295 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
11296 case bfd_target_elf_flavour:
11297 {
11298 const char *format;
11299
11300 switch (x86_elf_abi)
11301 {
11302 default:
11303 format = ELF_TARGET_FORMAT;
11304 break;
11305 case X86_64_ABI:
11306 use_rela_relocations = 1;
11307 object_64bit = 1;
11308 format = ELF_TARGET_FORMAT64;
11309 break;
11310 case X86_64_X32_ABI:
11311 use_rela_relocations = 1;
11312 object_64bit = 1;
11313 disallow_64bit_reloc = 1;
11314 format = ELF_TARGET_FORMAT32;
11315 break;
11316 }
11317 if (cpu_arch_isa == PROCESSOR_L1OM)
11318 {
11319 if (x86_elf_abi != X86_64_ABI)
11320 as_fatal (_("Intel L1OM is 64bit only"));
11321 return ELF_TARGET_L1OM_FORMAT;
11322 }
11323 else if (cpu_arch_isa == PROCESSOR_K1OM)
11324 {
11325 if (x86_elf_abi != X86_64_ABI)
11326 as_fatal (_("Intel K1OM is 64bit only"));
11327 return ELF_TARGET_K1OM_FORMAT;
11328 }
11329 else if (cpu_arch_isa == PROCESSOR_IAMCU)
11330 {
11331 if (x86_elf_abi != I386_ABI)
11332 as_fatal (_("Intel MCU is 32bit only"));
11333 return ELF_TARGET_IAMCU_FORMAT;
11334 }
11335 else
11336 return format;
11337 }
11338 #endif
11339 #if defined (OBJ_MACH_O)
11340 case bfd_target_mach_o_flavour:
11341 if (flag_code == CODE_64BIT)
11342 {
11343 use_rela_relocations = 1;
11344 object_64bit = 1;
11345 return "mach-o-x86-64";
11346 }
11347 else
11348 return "mach-o-i386";
11349 #endif
11350 default:
11351 abort ();
11352 return NULL;
11353 }
11354 }
11355
11356 #endif /* OBJ_MAYBE_ more than one */
11357 \f
11358 symbolS *
11359 md_undefined_symbol (char *name)
11360 {
11361 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
11362 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
11363 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
11364 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
11365 {
11366 if (!GOT_symbol)
11367 {
11368 if (symbol_find (name))
11369 as_bad (_("GOT already in symbol table"));
11370 GOT_symbol = symbol_new (name, undefined_section,
11371 (valueT) 0, &zero_address_frag);
11372 };
11373 return GOT_symbol;
11374 }
11375 return 0;
11376 }
11377
11378 /* Round up a section size to the appropriate boundary. */
11379
11380 valueT
11381 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
11382 {
11383 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
11384 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
11385 {
11386 /* For a.out, force the section size to be aligned. If we don't do
11387 this, BFD will align it for us, but it will not write out the
11388 final bytes of the section. This may be a bug in BFD, but it is
11389 easier to fix it here since that is how the other a.out targets
11390 work. */
11391 int align;
11392
11393 align = bfd_get_section_alignment (stdoutput, segment);
11394 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
11395 }
11396 #endif
11397
11398 return size;
11399 }
11400
11401 /* On the i386, PC-relative offsets are relative to the start of the
11402 next instruction. That is, the address of the offset, plus its
11403 size, since the offset is always the last part of the insn. */
11404
11405 long
11406 md_pcrel_from (fixS *fixP)
11407 {
11408 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
11409 }
11410
11411 #ifndef I386COFF
11412
11413 static void
11414 s_bss (int ignore ATTRIBUTE_UNUSED)
11415 {
11416 int temp;
11417
11418 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11419 if (IS_ELF)
11420 obj_elf_section_change_hook ();
11421 #endif
11422 temp = get_absolute_expression ();
11423 subseg_set (bss_section, (subsegT) temp);
11424 demand_empty_rest_of_line ();
11425 }
11426
11427 #endif
11428
11429 void
11430 i386_validate_fix (fixS *fixp)
11431 {
11432 if (fixp->fx_subsy)
11433 {
11434 if (fixp->fx_subsy == GOT_symbol)
11435 {
11436 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
11437 {
11438 if (!object_64bit)
11439 abort ();
11440 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11441 if (fixp->fx_tcbit2)
11442 fixp->fx_r_type = (fixp->fx_tcbit
11443 ? BFD_RELOC_X86_64_REX_GOTPCRELX
11444 : BFD_RELOC_X86_64_GOTPCRELX);
11445 else
11446 #endif
11447 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
11448 }
11449 else
11450 {
11451 if (!object_64bit)
11452 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
11453 else
11454 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
11455 }
11456 fixp->fx_subsy = 0;
11457 }
11458 }
11459 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11460 else if (!object_64bit)
11461 {
11462 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
11463 && fixp->fx_tcbit2)
11464 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
11465 }
11466 #endif
11467 }
11468
11469 arelent *
11470 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
11471 {
11472 arelent *rel;
11473 bfd_reloc_code_real_type code;
11474
11475 switch (fixp->fx_r_type)
11476 {
11477 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11478 case BFD_RELOC_SIZE32:
11479 case BFD_RELOC_SIZE64:
11480 if (S_IS_DEFINED (fixp->fx_addsy)
11481 && !S_IS_EXTERNAL (fixp->fx_addsy))
11482 {
11483 /* Resolve size relocation against local symbol to size of
11484 the symbol plus addend. */
11485 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
11486 if (fixp->fx_r_type == BFD_RELOC_SIZE32
11487 && !fits_in_unsigned_long (value))
11488 as_bad_where (fixp->fx_file, fixp->fx_line,
11489 _("symbol size computation overflow"));
11490 fixp->fx_addsy = NULL;
11491 fixp->fx_subsy = NULL;
11492 md_apply_fix (fixp, (valueT *) &value, NULL);
11493 return NULL;
11494 }
11495 #endif
11496 /* Fall through. */
11497
11498 case BFD_RELOC_X86_64_PLT32:
11499 case BFD_RELOC_X86_64_GOT32:
11500 case BFD_RELOC_X86_64_GOTPCREL:
11501 case BFD_RELOC_X86_64_GOTPCRELX:
11502 case BFD_RELOC_X86_64_REX_GOTPCRELX:
11503 case BFD_RELOC_386_PLT32:
11504 case BFD_RELOC_386_GOT32:
11505 case BFD_RELOC_386_GOT32X:
11506 case BFD_RELOC_386_GOTOFF:
11507 case BFD_RELOC_386_GOTPC:
11508 case BFD_RELOC_386_TLS_GD:
11509 case BFD_RELOC_386_TLS_LDM:
11510 case BFD_RELOC_386_TLS_LDO_32:
11511 case BFD_RELOC_386_TLS_IE_32:
11512 case BFD_RELOC_386_TLS_IE:
11513 case BFD_RELOC_386_TLS_GOTIE:
11514 case BFD_RELOC_386_TLS_LE_32:
11515 case BFD_RELOC_386_TLS_LE:
11516 case BFD_RELOC_386_TLS_GOTDESC:
11517 case BFD_RELOC_386_TLS_DESC_CALL:
11518 case BFD_RELOC_X86_64_TLSGD:
11519 case BFD_RELOC_X86_64_TLSLD:
11520 case BFD_RELOC_X86_64_DTPOFF32:
11521 case BFD_RELOC_X86_64_DTPOFF64:
11522 case BFD_RELOC_X86_64_GOTTPOFF:
11523 case BFD_RELOC_X86_64_TPOFF32:
11524 case BFD_RELOC_X86_64_TPOFF64:
11525 case BFD_RELOC_X86_64_GOTOFF64:
11526 case BFD_RELOC_X86_64_GOTPC32:
11527 case BFD_RELOC_X86_64_GOT64:
11528 case BFD_RELOC_X86_64_GOTPCREL64:
11529 case BFD_RELOC_X86_64_GOTPC64:
11530 case BFD_RELOC_X86_64_GOTPLT64:
11531 case BFD_RELOC_X86_64_PLTOFF64:
11532 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11533 case BFD_RELOC_X86_64_TLSDESC_CALL:
11534 case BFD_RELOC_RVA:
11535 case BFD_RELOC_VTABLE_ENTRY:
11536 case BFD_RELOC_VTABLE_INHERIT:
11537 #ifdef TE_PE
11538 case BFD_RELOC_32_SECREL:
11539 #endif
11540 code = fixp->fx_r_type;
11541 break;
11542 case BFD_RELOC_X86_64_32S:
11543 if (!fixp->fx_pcrel)
11544 {
11545 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
11546 code = fixp->fx_r_type;
11547 break;
11548 }
11549 /* Fall through. */
11550 default:
11551 if (fixp->fx_pcrel)
11552 {
11553 switch (fixp->fx_size)
11554 {
11555 default:
11556 as_bad_where (fixp->fx_file, fixp->fx_line,
11557 _("can not do %d byte pc-relative relocation"),
11558 fixp->fx_size);
11559 code = BFD_RELOC_32_PCREL;
11560 break;
11561 case 1: code = BFD_RELOC_8_PCREL; break;
11562 case 2: code = BFD_RELOC_16_PCREL; break;
11563 case 4: code = BFD_RELOC_32_PCREL; break;
11564 #ifdef BFD64
11565 case 8: code = BFD_RELOC_64_PCREL; break;
11566 #endif
11567 }
11568 }
11569 else
11570 {
11571 switch (fixp->fx_size)
11572 {
11573 default:
11574 as_bad_where (fixp->fx_file, fixp->fx_line,
11575 _("can not do %d byte relocation"),
11576 fixp->fx_size);
11577 code = BFD_RELOC_32;
11578 break;
11579 case 1: code = BFD_RELOC_8; break;
11580 case 2: code = BFD_RELOC_16; break;
11581 case 4: code = BFD_RELOC_32; break;
11582 #ifdef BFD64
11583 case 8: code = BFD_RELOC_64; break;
11584 #endif
11585 }
11586 }
11587 break;
11588 }
11589
11590 if ((code == BFD_RELOC_32
11591 || code == BFD_RELOC_32_PCREL
11592 || code == BFD_RELOC_X86_64_32S)
11593 && GOT_symbol
11594 && fixp->fx_addsy == GOT_symbol)
11595 {
11596 if (!object_64bit)
11597 code = BFD_RELOC_386_GOTPC;
11598 else
11599 code = BFD_RELOC_X86_64_GOTPC32;
11600 }
11601 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
11602 && GOT_symbol
11603 && fixp->fx_addsy == GOT_symbol)
11604 {
11605 code = BFD_RELOC_X86_64_GOTPC64;
11606 }
11607
11608 rel = XNEW (arelent);
11609 rel->sym_ptr_ptr = XNEW (asymbol *);
11610 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
11611
11612 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
11613
11614 if (!use_rela_relocations)
11615 {
11616 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
11617 vtable entry to be used in the relocation's section offset. */
11618 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
11619 rel->address = fixp->fx_offset;
11620 #if defined (OBJ_COFF) && defined (TE_PE)
11621 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
11622 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
11623 else
11624 #endif
11625 rel->addend = 0;
11626 }
11627 /* Use the rela in 64bit mode. */
11628 else
11629 {
11630 if (disallow_64bit_reloc)
11631 switch (code)
11632 {
11633 case BFD_RELOC_X86_64_DTPOFF64:
11634 case BFD_RELOC_X86_64_TPOFF64:
11635 case BFD_RELOC_64_PCREL:
11636 case BFD_RELOC_X86_64_GOTOFF64:
11637 case BFD_RELOC_X86_64_GOT64:
11638 case BFD_RELOC_X86_64_GOTPCREL64:
11639 case BFD_RELOC_X86_64_GOTPC64:
11640 case BFD_RELOC_X86_64_GOTPLT64:
11641 case BFD_RELOC_X86_64_PLTOFF64:
11642 as_bad_where (fixp->fx_file, fixp->fx_line,
11643 _("cannot represent relocation type %s in x32 mode"),
11644 bfd_get_reloc_code_name (code));
11645 break;
11646 default:
11647 break;
11648 }
11649
11650 if (!fixp->fx_pcrel)
11651 rel->addend = fixp->fx_offset;
11652 else
11653 switch (code)
11654 {
11655 case BFD_RELOC_X86_64_PLT32:
11656 case BFD_RELOC_X86_64_GOT32:
11657 case BFD_RELOC_X86_64_GOTPCREL:
11658 case BFD_RELOC_X86_64_GOTPCRELX:
11659 case BFD_RELOC_X86_64_REX_GOTPCRELX:
11660 case BFD_RELOC_X86_64_TLSGD:
11661 case BFD_RELOC_X86_64_TLSLD:
11662 case BFD_RELOC_X86_64_GOTTPOFF:
11663 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
11664 case BFD_RELOC_X86_64_TLSDESC_CALL:
11665 rel->addend = fixp->fx_offset - fixp->fx_size;
11666 break;
11667 default:
11668 rel->addend = (section->vma
11669 - fixp->fx_size
11670 + fixp->fx_addnumber
11671 + md_pcrel_from (fixp));
11672 break;
11673 }
11674 }
11675
11676 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
11677 if (rel->howto == NULL)
11678 {
11679 as_bad_where (fixp->fx_file, fixp->fx_line,
11680 _("cannot represent relocation type %s"),
11681 bfd_get_reloc_code_name (code));
11682 /* Set howto to a garbage value so that we can keep going. */
11683 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
11684 gas_assert (rel->howto != NULL);
11685 }
11686
11687 return rel;
11688 }
11689
11690 #include "tc-i386-intel.c"
11691
11692 void
11693 tc_x86_parse_to_dw2regnum (expressionS *exp)
11694 {
11695 int saved_naked_reg;
11696 char saved_register_dot;
11697
11698 saved_naked_reg = allow_naked_reg;
11699 allow_naked_reg = 1;
11700 saved_register_dot = register_chars['.'];
11701 register_chars['.'] = '.';
11702 allow_pseudo_reg = 1;
11703 expression_and_evaluate (exp);
11704 allow_pseudo_reg = 0;
11705 register_chars['.'] = saved_register_dot;
11706 allow_naked_reg = saved_naked_reg;
11707
11708 if (exp->X_op == O_register && exp->X_add_number >= 0)
11709 {
11710 if ((addressT) exp->X_add_number < i386_regtab_size)
11711 {
11712 exp->X_op = O_constant;
11713 exp->X_add_number = i386_regtab[exp->X_add_number]
11714 .dw2_regnum[flag_code >> 1];
11715 }
11716 else
11717 exp->X_op = O_illegal;
11718 }
11719 }
11720
11721 void
11722 tc_x86_frame_initial_instructions (void)
11723 {
11724 static unsigned int sp_regno[2];
11725
11726 if (!sp_regno[flag_code >> 1])
11727 {
11728 char *saved_input = input_line_pointer;
11729 char sp[][4] = {"esp", "rsp"};
11730 expressionS exp;
11731
11732 input_line_pointer = sp[flag_code >> 1];
11733 tc_x86_parse_to_dw2regnum (&exp);
11734 gas_assert (exp.X_op == O_constant);
11735 sp_regno[flag_code >> 1] = exp.X_add_number;
11736 input_line_pointer = saved_input;
11737 }
11738
11739 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
11740 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
11741 }
11742
11743 int
11744 x86_dwarf2_addr_size (void)
11745 {
11746 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
11747 if (x86_elf_abi == X86_64_X32_ABI)
11748 return 4;
11749 #endif
11750 return bfd_arch_bits_per_address (stdoutput) / 8;
11751 }
11752
11753 int
11754 i386_elf_section_type (const char *str, size_t len)
11755 {
11756 if (flag_code == CODE_64BIT
11757 && len == sizeof ("unwind") - 1
11758 && strncmp (str, "unwind", 6) == 0)
11759 return SHT_X86_64_UNWIND;
11760
11761 return -1;
11762 }
11763
11764 #ifdef TE_SOLARIS
11765 void
11766 i386_solaris_fix_up_eh_frame (segT sec)
11767 {
11768 if (flag_code == CODE_64BIT)
11769 elf_section_type (sec) = SHT_X86_64_UNWIND;
11770 }
11771 #endif
11772
11773 #ifdef TE_PE
11774 void
11775 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
11776 {
11777 expressionS exp;
11778
11779 exp.X_op = O_secrel;
11780 exp.X_add_symbol = symbol;
11781 exp.X_add_number = 0;
11782 emit_expr (&exp, size);
11783 }
11784 #endif
11785
11786 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11787 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
11788
11789 bfd_vma
11790 x86_64_section_letter (int letter, const char **ptr_msg)
11791 {
11792 if (flag_code == CODE_64BIT)
11793 {
11794 if (letter == 'l')
11795 return SHF_X86_64_LARGE;
11796
11797 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
11798 }
11799 else
11800 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
11801 return -1;
11802 }
11803
11804 bfd_vma
11805 x86_64_section_word (char *str, size_t len)
11806 {
11807 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
11808 return SHF_X86_64_LARGE;
11809
11810 return -1;
11811 }
11812
11813 static void
11814 handle_large_common (int small ATTRIBUTE_UNUSED)
11815 {
11816 if (flag_code != CODE_64BIT)
11817 {
11818 s_comm_internal (0, elf_common_parse);
11819 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
11820 }
11821 else
11822 {
11823 static segT lbss_section;
11824 asection *saved_com_section_ptr = elf_com_section_ptr;
11825 asection *saved_bss_section = bss_section;
11826
11827 if (lbss_section == NULL)
11828 {
11829 flagword applicable;
11830 segT seg = now_seg;
11831 subsegT subseg = now_subseg;
11832
11833 /* The .lbss section is for local .largecomm symbols. */
11834 lbss_section = subseg_new (".lbss", 0);
11835 applicable = bfd_applicable_section_flags (stdoutput);
11836 bfd_set_section_flags (stdoutput, lbss_section,
11837 applicable & SEC_ALLOC);
11838 seg_info (lbss_section)->bss = 1;
11839
11840 subseg_set (seg, subseg);
11841 }
11842
11843 elf_com_section_ptr = &_bfd_elf_large_com_section;
11844 bss_section = lbss_section;
11845
11846 s_comm_internal (0, elf_common_parse);
11847
11848 elf_com_section_ptr = saved_com_section_ptr;
11849 bss_section = saved_bss_section;
11850 }
11851 }
11852 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */