]> git.ipfire.org Git - thirdparty/binutils-gdb.git/blob - gas/config/tc-riscv.c
RISC-V: Compress 3-operand beq/bne against x0.
[thirdparty/binutils-gdb.git] / gas / config / tc-riscv.c
1 /* tc-riscv.c -- RISC-V assembler
2 Copyright (C) 2011-2019 Free Software Foundation, Inc.
3
4 Contributed by Andrew Waterman (andrew@sifive.com).
5 Based on MIPS target.
6
7 This file is part of GAS.
8
9 GAS is free software; you can redistribute it and/or modify
10 it under the terms of the GNU General Public License as published by
11 the Free Software Foundation; either version 3, or (at your option)
12 any later version.
13
14 GAS is distributed in the hope that it will be useful,
15 but WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 GNU General Public License for more details.
18
19 You should have received a copy of the GNU General Public License
20 along with this program; see the file COPYING3. If not,
21 see <http://www.gnu.org/licenses/>. */
22
23 #include "as.h"
24 #include "config.h"
25 #include "subsegs.h"
26 #include "safe-ctype.h"
27
28 #include "itbl-ops.h"
29 #include "dwarf2dbg.h"
30 #include "dw2gencfi.h"
31
32 #include "bfd/elfxx-riscv.h"
33 #include "elf/riscv.h"
34 #include "opcode/riscv.h"
35
36 #include <stdint.h>
37
38 /* Information about an instruction, including its format, operands
39 and fixups. */
40 struct riscv_cl_insn
41 {
42 /* The opcode's entry in riscv_opcodes. */
43 const struct riscv_opcode *insn_mo;
44
45 /* The encoded instruction bits. */
46 insn_t insn_opcode;
47
48 /* The frag that contains the instruction. */
49 struct frag *frag;
50
51 /* The offset into FRAG of the first instruction byte. */
52 long where;
53
54 /* The relocs associated with the instruction, if any. */
55 fixS *fixp;
56 };
57
58 #ifndef DEFAULT_ARCH
59 #define DEFAULT_ARCH "riscv64"
60 #endif
61
62 #ifndef DEFAULT_RISCV_ATTR
63 #define DEFAULT_RISCV_ATTR 0
64 #endif
65
66 static const char default_arch[] = DEFAULT_ARCH;
67
68 static unsigned xlen = 0; /* width of an x-register */
69 static unsigned abi_xlen = 0; /* width of a pointer in the ABI */
70 static bfd_boolean rve_abi = FALSE;
71
72 #define LOAD_ADDRESS_INSN (abi_xlen == 64 ? "ld" : "lw")
73 #define ADD32_INSN (xlen == 64 ? "addiw" : "addi")
74
75 static unsigned elf_flags = 0;
76
77 /* This is the set of options which the .option pseudo-op may modify. */
78
79 struct riscv_set_options
80 {
81 int pic; /* Generate position-independent code. */
82 int rvc; /* Generate RVC code. */
83 int rve; /* Generate RVE code. */
84 int relax; /* Emit relocs the linker is allowed to relax. */
85 int arch_attr; /* Emit arch attribute. */
86 };
87
88 static struct riscv_set_options riscv_opts =
89 {
90 0, /* pic */
91 0, /* rvc */
92 0, /* rve */
93 1, /* relax */
94 DEFAULT_RISCV_ATTR, /* arch_attr */
95 };
96
97 static void
98 riscv_set_rvc (bfd_boolean rvc_value)
99 {
100 if (rvc_value)
101 elf_flags |= EF_RISCV_RVC;
102
103 riscv_opts.rvc = rvc_value;
104 }
105
106 static void
107 riscv_set_rve (bfd_boolean rve_value)
108 {
109 riscv_opts.rve = rve_value;
110 }
111
112 static riscv_subset_list_t riscv_subsets;
113
114 static bfd_boolean
115 riscv_subset_supports (const char *feature)
116 {
117 if (riscv_opts.rvc && (strcasecmp (feature, "c") == 0))
118 return TRUE;
119
120 return riscv_lookup_subset (&riscv_subsets, feature) != NULL;
121 }
122
123 static bfd_boolean
124 riscv_multi_subset_supports (const char *features[])
125 {
126 unsigned i = 0;
127 bfd_boolean supported = TRUE;
128
129 for (;features[i]; ++i)
130 supported = supported && riscv_subset_supports (features[i]);
131
132 return supported;
133 }
134
135 /* Set which ISA and extensions are available. */
136
137 static void
138 riscv_set_arch (const char *s)
139 {
140 riscv_parse_subset_t rps;
141 rps.subset_list = &riscv_subsets;
142 rps.error_handler = as_fatal;
143 rps.xlen = &xlen;
144
145 riscv_release_subset_list (&riscv_subsets);
146 riscv_parse_subset (&rps, s);
147 }
148
149 /* Handle of the OPCODE hash table. */
150 static struct hash_control *op_hash = NULL;
151
152 /* Handle of the type of .insn hash table. */
153 static struct hash_control *insn_type_hash = NULL;
154
155 /* This array holds the chars that always start a comment. If the
156 pre-processor is disabled, these aren't very useful */
157 const char comment_chars[] = "#";
158
159 /* This array holds the chars that only start a comment at the beginning of
160 a line. If the line seems to have the form '# 123 filename'
161 .line and .file directives will appear in the pre-processed output */
162 /* Note that input_file.c hand checks for '#' at the beginning of the
163 first line of the input file. This is because the compiler outputs
164 #NO_APP at the beginning of its output. */
165 /* Also note that C style comments are always supported. */
166 const char line_comment_chars[] = "#";
167
168 /* This array holds machine specific line separator characters. */
169 const char line_separator_chars[] = ";";
170
171 /* Chars that can be used to separate mant from exp in floating point nums */
172 const char EXP_CHARS[] = "eE";
173
174 /* Chars that mean this number is a floating point constant */
175 /* As in 0f12.456 */
176 /* or 0d1.2345e12 */
177 const char FLT_CHARS[] = "rRsSfFdDxXpP";
178
179 /* Indicate we are already assemble any instructions or not. */
180 static bfd_boolean start_assemble = FALSE;
181
182 /* Indicate arch attribute is explictly set. */
183 static bfd_boolean explicit_arch_attr = FALSE;
184
185 /* Macros for encoding relaxation state for RVC branches and far jumps. */
186 #define RELAX_BRANCH_ENCODE(uncond, rvc, length) \
187 ((relax_substateT) \
188 (0xc0000000 \
189 | ((uncond) ? 1 : 0) \
190 | ((rvc) ? 2 : 0) \
191 | ((length) << 2)))
192 #define RELAX_BRANCH_P(i) (((i) & 0xf0000000) == 0xc0000000)
193 #define RELAX_BRANCH_LENGTH(i) (((i) >> 2) & 0xF)
194 #define RELAX_BRANCH_RVC(i) (((i) & 2) != 0)
195 #define RELAX_BRANCH_UNCOND(i) (((i) & 1) != 0)
196
197 /* Is the given value a sign-extended 32-bit value? */
198 #define IS_SEXT_32BIT_NUM(x) \
199 (((x) &~ (offsetT) 0x7fffffff) == 0 \
200 || (((x) &~ (offsetT) 0x7fffffff) == ~ (offsetT) 0x7fffffff))
201
202 /* Is the given value a zero-extended 32-bit value? Or a negated one? */
203 #define IS_ZEXT_32BIT_NUM(x) \
204 (((x) &~ (offsetT) 0xffffffff) == 0 \
205 || (((x) &~ (offsetT) 0xffffffff) == ~ (offsetT) 0xffffffff))
206
207 /* Change INSN's opcode so that the operand given by FIELD has value VALUE.
208 INSN is a riscv_cl_insn structure and VALUE is evaluated exactly once. */
209 #define INSERT_OPERAND(FIELD, INSN, VALUE) \
210 INSERT_BITS ((INSN).insn_opcode, VALUE, OP_MASK_##FIELD, OP_SH_##FIELD)
211
212 /* Determine if an instruction matches an opcode. */
213 #define OPCODE_MATCHES(OPCODE, OP) \
214 (((OPCODE) & MASK_##OP) == MATCH_##OP)
215
216 static char *expr_end;
217
218 /* The default target format to use. */
219
220 const char *
221 riscv_target_format (void)
222 {
223 return xlen == 64 ? "elf64-littleriscv" : "elf32-littleriscv";
224 }
225
226 /* Return the length of instruction INSN. */
227
228 static inline unsigned int
229 insn_length (const struct riscv_cl_insn *insn)
230 {
231 return riscv_insn_length (insn->insn_opcode);
232 }
233
234 /* Initialise INSN from opcode entry MO. Leave its position unspecified. */
235
236 static void
237 create_insn (struct riscv_cl_insn *insn, const struct riscv_opcode *mo)
238 {
239 insn->insn_mo = mo;
240 insn->insn_opcode = mo->match;
241 insn->frag = NULL;
242 insn->where = 0;
243 insn->fixp = NULL;
244 }
245
246 /* Install INSN at the location specified by its "frag" and "where" fields. */
247
248 static void
249 install_insn (const struct riscv_cl_insn *insn)
250 {
251 char *f = insn->frag->fr_literal + insn->where;
252 md_number_to_chars (f, insn->insn_opcode, insn_length (insn));
253 }
254
255 /* Move INSN to offset WHERE in FRAG. Adjust the fixups accordingly
256 and install the opcode in the new location. */
257
258 static void
259 move_insn (struct riscv_cl_insn *insn, fragS *frag, long where)
260 {
261 insn->frag = frag;
262 insn->where = where;
263 if (insn->fixp != NULL)
264 {
265 insn->fixp->fx_frag = frag;
266 insn->fixp->fx_where = where;
267 }
268 install_insn (insn);
269 }
270
271 /* Add INSN to the end of the output. */
272
273 static void
274 add_fixed_insn (struct riscv_cl_insn *insn)
275 {
276 char *f = frag_more (insn_length (insn));
277 move_insn (insn, frag_now, f - frag_now->fr_literal);
278 }
279
280 static void
281 add_relaxed_insn (struct riscv_cl_insn *insn, int max_chars, int var,
282 relax_substateT subtype, symbolS *symbol, offsetT offset)
283 {
284 frag_grow (max_chars);
285 move_insn (insn, frag_now, frag_more (0) - frag_now->fr_literal);
286 frag_var (rs_machine_dependent, max_chars, var,
287 subtype, symbol, offset, NULL);
288 }
289
290 /* Compute the length of a branch sequence, and adjust the stored length
291 accordingly. If FRAGP is NULL, the worst-case length is returned. */
292
293 static unsigned
294 relaxed_branch_length (fragS *fragp, asection *sec, int update)
295 {
296 int jump, rvc, length = 8;
297
298 if (!fragp)
299 return length;
300
301 jump = RELAX_BRANCH_UNCOND (fragp->fr_subtype);
302 rvc = RELAX_BRANCH_RVC (fragp->fr_subtype);
303 length = RELAX_BRANCH_LENGTH (fragp->fr_subtype);
304
305 /* Assume jumps are in range; the linker will catch any that aren't. */
306 length = jump ? 4 : 8;
307
308 if (fragp->fr_symbol != NULL
309 && S_IS_DEFINED (fragp->fr_symbol)
310 && !S_IS_WEAK (fragp->fr_symbol)
311 && sec == S_GET_SEGMENT (fragp->fr_symbol))
312 {
313 offsetT val = S_GET_VALUE (fragp->fr_symbol) + fragp->fr_offset;
314 bfd_vma rvc_range = jump ? RVC_JUMP_REACH : RVC_BRANCH_REACH;
315 val -= fragp->fr_address + fragp->fr_fix;
316
317 if (rvc && (bfd_vma)(val + rvc_range/2) < rvc_range)
318 length = 2;
319 else if ((bfd_vma)(val + RISCV_BRANCH_REACH/2) < RISCV_BRANCH_REACH)
320 length = 4;
321 else if (!jump && rvc)
322 length = 6;
323 }
324
325 if (update)
326 fragp->fr_subtype = RELAX_BRANCH_ENCODE (jump, rvc, length);
327
328 return length;
329 }
330
331 /* Information about an opcode name, mnemonics and its value. */
332 struct opcode_name_t
333 {
334 const char *name;
335 unsigned int val;
336 };
337
338 /* List for all supported opcode name. */
339 static const struct opcode_name_t opcode_name_list[] =
340 {
341 {"C0", 0x0},
342 {"C1", 0x1},
343 {"C2", 0x2},
344
345 {"LOAD", 0x03},
346 {"LOAD_FP", 0x07},
347 {"CUSTOM_0", 0x0b},
348 {"MISC_MEM", 0x0f},
349 {"OP_IMM", 0x13},
350 {"AUIPC", 0x17},
351 {"OP_IMM_32", 0x1b},
352 /* 48b 0x1f. */
353
354 {"STORE", 0x23},
355 {"STORE_FP", 0x27},
356 {"CUSTOM_1", 0x2b},
357 {"AMO", 0x2f},
358 {"OP", 0x33},
359 {"LUI", 0x37},
360 {"OP_32", 0x3b},
361 /* 64b 0x3f. */
362
363 {"MADD", 0x43},
364 {"MSUB", 0x47},
365 {"NMADD", 0x4f},
366 {"NMSUB", 0x4b},
367 {"OP_FP", 0x53},
368 /*reserved 0x57. */
369 {"CUSTOM_2", 0x5b},
370 /* 48b 0x5f. */
371
372 {"BRANCH", 0x63},
373 {"JALR", 0x67},
374 /*reserved 0x5b. */
375 {"JAL", 0x6f},
376 {"SYSTEM", 0x73},
377 /*reserved 0x77. */
378 {"CUSTOM_3", 0x7b},
379 /* >80b 0x7f. */
380
381 {NULL, 0}
382 };
383
384 /* Hash table for lookup opcode name. */
385 static struct hash_control *opcode_names_hash = NULL;
386
387 /* Initialization for hash table of opcode name. */
388 static void
389 init_opcode_names_hash (void)
390 {
391 const char *retval;
392 const struct opcode_name_t *opcode;
393
394 for (opcode = &opcode_name_list[0]; opcode->name != NULL; ++opcode)
395 {
396 retval = hash_insert (opcode_names_hash, opcode->name, (void *)opcode);
397
398 if (retval != NULL)
399 as_fatal (_("internal error: can't hash `%s': %s"),
400 opcode->name, retval);
401 }
402 }
403
404 /* Find `s` is a valid opcode name or not,
405 return the opcode name info if found. */
406 static const struct opcode_name_t *
407 opcode_name_lookup (char **s)
408 {
409 char *e;
410 char save_c;
411 struct opcode_name_t *o;
412
413 /* Find end of name. */
414 e = *s;
415 if (is_name_beginner (*e))
416 ++e;
417 while (is_part_of_name (*e))
418 ++e;
419
420 /* Terminate name. */
421 save_c = *e;
422 *e = '\0';
423
424 o = (struct opcode_name_t *) hash_find (opcode_names_hash, *s);
425
426 /* Advance to next token if one was recognized. */
427 if (o)
428 *s = e;
429
430 *e = save_c;
431 expr_end = e;
432
433 return o;
434 }
435
436 struct regname
437 {
438 const char *name;
439 unsigned int num;
440 };
441
442 enum reg_class
443 {
444 RCLASS_GPR,
445 RCLASS_FPR,
446 RCLASS_CSR,
447 RCLASS_MAX
448 };
449
450 static struct hash_control *reg_names_hash = NULL;
451
452 #define ENCODE_REG_HASH(cls, n) \
453 ((void *)(uintptr_t)((n) * RCLASS_MAX + (cls) + 1))
454 #define DECODE_REG_CLASS(hash) (((uintptr_t)(hash) - 1) % RCLASS_MAX)
455 #define DECODE_REG_NUM(hash) (((uintptr_t)(hash) - 1) / RCLASS_MAX)
456
457 static void
458 hash_reg_name (enum reg_class class, const char *name, unsigned n)
459 {
460 void *hash = ENCODE_REG_HASH (class, n);
461 const char *retval = hash_insert (reg_names_hash, name, hash);
462
463 if (retval != NULL)
464 as_fatal (_("internal error: can't hash `%s': %s"), name, retval);
465 }
466
467 static void
468 hash_reg_names (enum reg_class class, const char * const names[], unsigned n)
469 {
470 unsigned i;
471
472 for (i = 0; i < n; i++)
473 hash_reg_name (class, names[i], i);
474 }
475
476 static unsigned int
477 reg_lookup_internal (const char *s, enum reg_class class)
478 {
479 struct regname *r = (struct regname *) hash_find (reg_names_hash, s);
480
481 if (r == NULL || DECODE_REG_CLASS (r) != class)
482 return -1;
483
484 if (riscv_opts.rve && class == RCLASS_GPR && DECODE_REG_NUM (r) > 15)
485 return -1;
486
487 return DECODE_REG_NUM (r);
488 }
489
490 static bfd_boolean
491 reg_lookup (char **s, enum reg_class class, unsigned int *regnop)
492 {
493 char *e;
494 char save_c;
495 int reg = -1;
496
497 /* Find end of name. */
498 e = *s;
499 if (is_name_beginner (*e))
500 ++e;
501 while (is_part_of_name (*e))
502 ++e;
503
504 /* Terminate name. */
505 save_c = *e;
506 *e = '\0';
507
508 /* Look for the register. Advance to next token if one was recognized. */
509 if ((reg = reg_lookup_internal (*s, class)) >= 0)
510 *s = e;
511
512 *e = save_c;
513 if (regnop)
514 *regnop = reg;
515 return reg >= 0;
516 }
517
518 static bfd_boolean
519 arg_lookup (char **s, const char *const *array, size_t size, unsigned *regnop)
520 {
521 const char *p = strchr (*s, ',');
522 size_t i, len = p ? (size_t)(p - *s) : strlen (*s);
523
524 if (len == 0)
525 return FALSE;
526
527 for (i = 0; i < size; i++)
528 if (array[i] != NULL && strncmp (array[i], *s, len) == 0)
529 {
530 *regnop = i;
531 *s += len;
532 return TRUE;
533 }
534
535 return FALSE;
536 }
537
538 /* For consistency checking, verify that all bits are specified either
539 by the match/mask part of the instruction definition, or by the
540 operand list.
541
542 `length` could be 0, 4 or 8, 0 for auto detection. */
543 static bfd_boolean
544 validate_riscv_insn (const struct riscv_opcode *opc, int length)
545 {
546 const char *p = opc->args;
547 char c;
548 insn_t used_bits = opc->mask;
549 int insn_width;
550 insn_t required_bits;
551
552 if (length == 0)
553 insn_width = 8 * riscv_insn_length (opc->match);
554 else
555 insn_width = 8 * length;
556
557 required_bits = ~0ULL >> (64 - insn_width);
558
559 if ((used_bits & opc->match) != (opc->match & required_bits))
560 {
561 as_bad (_("internal: bad RISC-V opcode (mask error): %s %s"),
562 opc->name, opc->args);
563 return FALSE;
564 }
565
566 #define USE_BITS(mask,shift) (used_bits |= ((insn_t)(mask) << (shift)))
567 while (*p)
568 switch (c = *p++)
569 {
570 case 'C': /* RVC */
571 switch (c = *p++)
572 {
573 case 'a': used_bits |= ENCODE_RVC_J_IMM (-1U); break;
574 case 'c': break; /* RS1, constrained to equal sp */
575 case 'i': used_bits |= ENCODE_RVC_SIMM3(-1U); break;
576 case 'j': used_bits |= ENCODE_RVC_IMM (-1U); break;
577 case 'o': used_bits |= ENCODE_RVC_IMM (-1U); break;
578 case 'k': used_bits |= ENCODE_RVC_LW_IMM (-1U); break;
579 case 'l': used_bits |= ENCODE_RVC_LD_IMM (-1U); break;
580 case 'm': used_bits |= ENCODE_RVC_LWSP_IMM (-1U); break;
581 case 'n': used_bits |= ENCODE_RVC_LDSP_IMM (-1U); break;
582 case 'p': used_bits |= ENCODE_RVC_B_IMM (-1U); break;
583 case 's': USE_BITS (OP_MASK_CRS1S, OP_SH_CRS1S); break;
584 case 't': USE_BITS (OP_MASK_CRS2S, OP_SH_CRS2S); break;
585 case 'u': used_bits |= ENCODE_RVC_IMM (-1U); break;
586 case 'v': used_bits |= ENCODE_RVC_IMM (-1U); break;
587 case 'w': break; /* RS1S, constrained to equal RD */
588 case 'x': break; /* RS2S, constrained to equal RD */
589 case 'z': break; /* RS2S, contrained to be x0 */
590 case 'K': used_bits |= ENCODE_RVC_ADDI4SPN_IMM (-1U); break;
591 case 'L': used_bits |= ENCODE_RVC_ADDI16SP_IMM (-1U); break;
592 case 'M': used_bits |= ENCODE_RVC_SWSP_IMM (-1U); break;
593 case 'N': used_bits |= ENCODE_RVC_SDSP_IMM (-1U); break;
594 case 'U': break; /* RS1, constrained to equal RD */
595 case 'V': USE_BITS (OP_MASK_CRS2, OP_SH_CRS2); break;
596 case '<': used_bits |= ENCODE_RVC_IMM (-1U); break;
597 case '>': used_bits |= ENCODE_RVC_IMM (-1U); break;
598 case '8': used_bits |= ENCODE_RVC_UIMM8 (-1U); break;
599 case 'S': USE_BITS (OP_MASK_CRS1S, OP_SH_CRS1S); break;
600 case 'T': USE_BITS (OP_MASK_CRS2, OP_SH_CRS2); break;
601 case 'D': USE_BITS (OP_MASK_CRS2S, OP_SH_CRS2S); break;
602 case 'F': /* funct */
603 switch (c = *p++)
604 {
605 case '6': USE_BITS (OP_MASK_CFUNCT6, OP_SH_CFUNCT6); break;
606 case '4': USE_BITS (OP_MASK_CFUNCT4, OP_SH_CFUNCT4); break;
607 case '3': USE_BITS (OP_MASK_CFUNCT3, OP_SH_CFUNCT3); break;
608 case '2': USE_BITS (OP_MASK_CFUNCT2, OP_SH_CFUNCT2); break;
609 default:
610 as_bad (_("internal: bad RISC-V opcode"
611 " (unknown operand type `CF%c'): %s %s"),
612 c, opc->name, opc->args);
613 return FALSE;
614 }
615 break;
616 default:
617 as_bad (_("internal: bad RISC-V opcode (unknown operand type `C%c'): %s %s"),
618 c, opc->name, opc->args);
619 return FALSE;
620 }
621 break;
622 case ',': break;
623 case '(': break;
624 case ')': break;
625 case '<': USE_BITS (OP_MASK_SHAMTW, OP_SH_SHAMTW); break;
626 case '>': USE_BITS (OP_MASK_SHAMT, OP_SH_SHAMT); break;
627 case 'A': break;
628 case 'D': USE_BITS (OP_MASK_RD, OP_SH_RD); break;
629 case 'Z': USE_BITS (OP_MASK_RS1, OP_SH_RS1); break;
630 case 'E': USE_BITS (OP_MASK_CSR, OP_SH_CSR); break;
631 case 'I': break;
632 case 'R': USE_BITS (OP_MASK_RS3, OP_SH_RS3); break;
633 case 'S': USE_BITS (OP_MASK_RS1, OP_SH_RS1); break;
634 case 'U': USE_BITS (OP_MASK_RS1, OP_SH_RS1); /* fallthru */
635 case 'T': USE_BITS (OP_MASK_RS2, OP_SH_RS2); break;
636 case 'd': USE_BITS (OP_MASK_RD, OP_SH_RD); break;
637 case 'm': USE_BITS (OP_MASK_RM, OP_SH_RM); break;
638 case 's': USE_BITS (OP_MASK_RS1, OP_SH_RS1); break;
639 case 't': USE_BITS (OP_MASK_RS2, OP_SH_RS2); break;
640 case 'r': USE_BITS (OP_MASK_RS3, OP_SH_RS3); break;
641 case 'P': USE_BITS (OP_MASK_PRED, OP_SH_PRED); break;
642 case 'Q': USE_BITS (OP_MASK_SUCC, OP_SH_SUCC); break;
643 case 'o':
644 case 'j': used_bits |= ENCODE_ITYPE_IMM (-1U); break;
645 case 'a': used_bits |= ENCODE_UJTYPE_IMM (-1U); break;
646 case 'p': used_bits |= ENCODE_SBTYPE_IMM (-1U); break;
647 case 'q': used_bits |= ENCODE_STYPE_IMM (-1U); break;
648 case 'u': used_bits |= ENCODE_UTYPE_IMM (-1U); break;
649 case 'z': break;
650 case '[': break;
651 case ']': break;
652 case '0': break;
653 case '1': break;
654 case 'F': /* funct */
655 switch (c = *p++)
656 {
657 case '7': USE_BITS (OP_MASK_FUNCT7, OP_SH_FUNCT7); break;
658 case '3': USE_BITS (OP_MASK_FUNCT3, OP_SH_FUNCT3); break;
659 case '2': USE_BITS (OP_MASK_FUNCT2, OP_SH_FUNCT2); break;
660 default:
661 as_bad (_("internal: bad RISC-V opcode"
662 " (unknown operand type `F%c'): %s %s"),
663 c, opc->name, opc->args);
664 return FALSE;
665 }
666 break;
667 case 'O': /* opcode */
668 switch (c = *p++)
669 {
670 case '4': USE_BITS (OP_MASK_OP, OP_SH_OP); break;
671 case '2': USE_BITS (OP_MASK_OP2, OP_SH_OP2); break;
672 default:
673 as_bad (_("internal: bad RISC-V opcode"
674 " (unknown operand type `F%c'): %s %s"),
675 c, opc->name, opc->args);
676 return FALSE;
677 }
678 break;
679 default:
680 as_bad (_("internal: bad RISC-V opcode "
681 "(unknown operand type `%c'): %s %s"),
682 c, opc->name, opc->args);
683 return FALSE;
684 }
685 #undef USE_BITS
686 if (used_bits != required_bits)
687 {
688 as_bad (_("internal: bad RISC-V opcode (bits 0x%lx undefined): %s %s"),
689 ~(unsigned long)(used_bits & required_bits),
690 opc->name, opc->args);
691 return FALSE;
692 }
693 return TRUE;
694 }
695
696 struct percent_op_match
697 {
698 const char *str;
699 bfd_reloc_code_real_type reloc;
700 };
701
702 /* Common hash table initialization function for
703 instruction and .insn directive. */
704 static struct hash_control *
705 init_opcode_hash (const struct riscv_opcode *opcodes,
706 bfd_boolean insn_directive_p)
707 {
708 int i = 0;
709 int length;
710 struct hash_control *hash = hash_new ();
711 while (opcodes[i].name)
712 {
713 const char *name = opcodes[i].name;
714 const char *hash_error =
715 hash_insert (hash, name, (void *) &opcodes[i]);
716
717 if (hash_error)
718 {
719 fprintf (stderr, _("internal error: can't hash `%s': %s\n"),
720 opcodes[i].name, hash_error);
721 /* Probably a memory allocation problem? Give up now. */
722 as_fatal (_("Broken assembler. No assembly attempted."));
723 }
724
725 do
726 {
727 if (opcodes[i].pinfo != INSN_MACRO)
728 {
729 if (insn_directive_p)
730 length = ((name[0] == 'c') ? 2 : 4);
731 else
732 length = 0; /* Let assembler determine the length. */
733 if (!validate_riscv_insn (&opcodes[i], length))
734 as_fatal (_("Broken assembler. No assembly attempted."));
735 }
736 else
737 gas_assert (!insn_directive_p);
738 ++i;
739 }
740 while (opcodes[i].name && !strcmp (opcodes[i].name, name));
741 }
742
743 return hash;
744 }
745
746 /* This function is called once, at assembler startup time. It should set up
747 all the tables, etc. that the MD part of the assembler will need. */
748
749 void
750 md_begin (void)
751 {
752 unsigned long mach = xlen == 64 ? bfd_mach_riscv64 : bfd_mach_riscv32;
753
754 if (! bfd_set_arch_mach (stdoutput, bfd_arch_riscv, mach))
755 as_warn (_("Could not set architecture and machine"));
756
757 op_hash = init_opcode_hash (riscv_opcodes, FALSE);
758 insn_type_hash = init_opcode_hash (riscv_insn_types, TRUE);
759
760 reg_names_hash = hash_new ();
761 hash_reg_names (RCLASS_GPR, riscv_gpr_names_numeric, NGPR);
762 hash_reg_names (RCLASS_GPR, riscv_gpr_names_abi, NGPR);
763 hash_reg_names (RCLASS_FPR, riscv_fpr_names_numeric, NFPR);
764 hash_reg_names (RCLASS_FPR, riscv_fpr_names_abi, NFPR);
765
766 /* Add "fp" as an alias for "s0". */
767 hash_reg_name (RCLASS_GPR, "fp", 8);
768
769 opcode_names_hash = hash_new ();
770 init_opcode_names_hash ();
771
772 #define DECLARE_CSR(name, num) hash_reg_name (RCLASS_CSR, #name, num);
773 #define DECLARE_CSR_ALIAS(name, num) DECLARE_CSR(name, num);
774 #include "opcode/riscv-opc.h"
775 #undef DECLARE_CSR
776
777 /* Set the default alignment for the text section. */
778 record_alignment (text_section, riscv_opts.rvc ? 1 : 2);
779 }
780
781 static insn_t
782 riscv_apply_const_reloc (bfd_reloc_code_real_type reloc_type, bfd_vma value)
783 {
784 switch (reloc_type)
785 {
786 case BFD_RELOC_32:
787 return value;
788
789 case BFD_RELOC_RISCV_HI20:
790 return ENCODE_UTYPE_IMM (RISCV_CONST_HIGH_PART (value));
791
792 case BFD_RELOC_RISCV_LO12_S:
793 return ENCODE_STYPE_IMM (value);
794
795 case BFD_RELOC_RISCV_LO12_I:
796 return ENCODE_ITYPE_IMM (value);
797
798 default:
799 abort ();
800 }
801 }
802
803 /* Output an instruction. IP is the instruction information.
804 ADDRESS_EXPR is an operand of the instruction to be used with
805 RELOC_TYPE. */
806
807 static void
808 append_insn (struct riscv_cl_insn *ip, expressionS *address_expr,
809 bfd_reloc_code_real_type reloc_type)
810 {
811 dwarf2_emit_insn (0);
812
813 if (reloc_type != BFD_RELOC_UNUSED)
814 {
815 reloc_howto_type *howto;
816
817 gas_assert (address_expr);
818 if (reloc_type == BFD_RELOC_12_PCREL
819 || reloc_type == BFD_RELOC_RISCV_JMP)
820 {
821 int j = reloc_type == BFD_RELOC_RISCV_JMP;
822 int best_case = riscv_insn_length (ip->insn_opcode);
823 unsigned worst_case = relaxed_branch_length (NULL, NULL, 0);
824 add_relaxed_insn (ip, worst_case, best_case,
825 RELAX_BRANCH_ENCODE (j, best_case == 2, worst_case),
826 address_expr->X_add_symbol,
827 address_expr->X_add_number);
828 return;
829 }
830 else
831 {
832 howto = bfd_reloc_type_lookup (stdoutput, reloc_type);
833 if (howto == NULL)
834 as_bad (_("Unsupported RISC-V relocation number %d"), reloc_type);
835
836 ip->fixp = fix_new_exp (ip->frag, ip->where,
837 bfd_get_reloc_size (howto),
838 address_expr, FALSE, reloc_type);
839
840 ip->fixp->fx_tcbit = riscv_opts.relax;
841 }
842 }
843
844 add_fixed_insn (ip);
845 install_insn (ip);
846
847 /* We need to start a new frag after any instruction that can be
848 optimized away or compressed by the linker during relaxation, to prevent
849 the assembler from computing static offsets across such an instruction.
850 This is necessary to get correct EH info. */
851 if (reloc_type == BFD_RELOC_RISCV_CALL
852 || reloc_type == BFD_RELOC_RISCV_CALL_PLT
853 || reloc_type == BFD_RELOC_RISCV_HI20
854 || reloc_type == BFD_RELOC_RISCV_PCREL_HI20
855 || reloc_type == BFD_RELOC_RISCV_TPREL_HI20
856 || reloc_type == BFD_RELOC_RISCV_TPREL_ADD)
857 {
858 frag_wane (frag_now);
859 frag_new (0);
860 }
861 }
862
863 /* Build an instruction created by a macro expansion. This is passed
864 a pointer to the count of instructions created so far, an
865 expression, the name of the instruction to build, an operand format
866 string, and corresponding arguments. */
867
868 static void
869 macro_build (expressionS *ep, const char *name, const char *fmt, ...)
870 {
871 const struct riscv_opcode *mo;
872 struct riscv_cl_insn insn;
873 bfd_reloc_code_real_type r;
874 va_list args;
875
876 va_start (args, fmt);
877
878 r = BFD_RELOC_UNUSED;
879 mo = (struct riscv_opcode *) hash_find (op_hash, name);
880 gas_assert (mo);
881
882 /* Find a non-RVC variant of the instruction. append_insn will compress
883 it if possible. */
884 while (riscv_insn_length (mo->match) < 4)
885 mo++;
886 gas_assert (strcmp (name, mo->name) == 0);
887
888 create_insn (&insn, mo);
889 for (;;)
890 {
891 switch (*fmt++)
892 {
893 case 'd':
894 INSERT_OPERAND (RD, insn, va_arg (args, int));
895 continue;
896
897 case 's':
898 INSERT_OPERAND (RS1, insn, va_arg (args, int));
899 continue;
900
901 case 't':
902 INSERT_OPERAND (RS2, insn, va_arg (args, int));
903 continue;
904
905 case '>':
906 INSERT_OPERAND (SHAMT, insn, va_arg (args, int));
907 continue;
908
909 case 'j':
910 case 'u':
911 case 'q':
912 gas_assert (ep != NULL);
913 r = va_arg (args, int);
914 continue;
915
916 case '\0':
917 break;
918 case ',':
919 continue;
920 default:
921 as_fatal (_("internal error: invalid macro"));
922 }
923 break;
924 }
925 va_end (args);
926 gas_assert (r == BFD_RELOC_UNUSED ? ep == NULL : ep != NULL);
927
928 append_insn (&insn, ep, r);
929 }
930
931 /* Sign-extend 32-bit mode constants that have bit 31 set and all higher bits
932 unset. */
933 static void
934 normalize_constant_expr (expressionS *ex)
935 {
936 if (xlen > 32)
937 return;
938 if ((ex->X_op == O_constant || ex->X_op == O_symbol)
939 && IS_ZEXT_32BIT_NUM (ex->X_add_number))
940 ex->X_add_number = (((ex->X_add_number & 0xffffffff) ^ 0x80000000)
941 - 0x80000000);
942 }
943
944 /* Fail if an expression EX is not a constant. IP is the instruction using EX.
945 MAYBE_CSR is true if the symbol may be an unrecognized CSR name. */
946
947 static void
948 check_absolute_expr (struct riscv_cl_insn *ip, expressionS *ex,
949 bfd_boolean maybe_csr)
950 {
951 if (ex->X_op == O_big)
952 as_bad (_("unsupported large constant"));
953 else if (maybe_csr && ex->X_op == O_symbol)
954 as_bad (_("unknown CSR `%s'"),
955 S_GET_NAME (ex->X_add_symbol));
956 else if (ex->X_op != O_constant)
957 as_bad (_("Instruction %s requires absolute expression"),
958 ip->insn_mo->name);
959 normalize_constant_expr (ex);
960 }
961
962 static symbolS *
963 make_internal_label (void)
964 {
965 return (symbolS *) local_symbol_make (FAKE_LABEL_NAME, now_seg,
966 (valueT) frag_now_fix (), frag_now);
967 }
968
969 /* Load an entry from the GOT. */
970 static void
971 pcrel_access (int destreg, int tempreg, expressionS *ep,
972 const char *lo_insn, const char *lo_pattern,
973 bfd_reloc_code_real_type hi_reloc,
974 bfd_reloc_code_real_type lo_reloc)
975 {
976 expressionS ep2;
977 ep2.X_op = O_symbol;
978 ep2.X_add_symbol = make_internal_label ();
979 ep2.X_add_number = 0;
980
981 macro_build (ep, "auipc", "d,u", tempreg, hi_reloc);
982 macro_build (&ep2, lo_insn, lo_pattern, destreg, tempreg, lo_reloc);
983 }
984
985 static void
986 pcrel_load (int destreg, int tempreg, expressionS *ep, const char *lo_insn,
987 bfd_reloc_code_real_type hi_reloc,
988 bfd_reloc_code_real_type lo_reloc)
989 {
990 pcrel_access (destreg, tempreg, ep, lo_insn, "d,s,j", hi_reloc, lo_reloc);
991 }
992
993 static void
994 pcrel_store (int srcreg, int tempreg, expressionS *ep, const char *lo_insn,
995 bfd_reloc_code_real_type hi_reloc,
996 bfd_reloc_code_real_type lo_reloc)
997 {
998 pcrel_access (srcreg, tempreg, ep, lo_insn, "t,s,q", hi_reloc, lo_reloc);
999 }
1000
1001 /* PC-relative function call using AUIPC/JALR, relaxed to JAL. */
1002 static void
1003 riscv_call (int destreg, int tempreg, expressionS *ep,
1004 bfd_reloc_code_real_type reloc)
1005 {
1006 macro_build (ep, "auipc", "d,u", tempreg, reloc);
1007 macro_build (NULL, "jalr", "d,s", destreg, tempreg);
1008 }
1009
1010 /* Load an integer constant into a register. */
1011
1012 static void
1013 load_const (int reg, expressionS *ep)
1014 {
1015 int shift = RISCV_IMM_BITS;
1016 expressionS upper = *ep, lower = *ep;
1017 lower.X_add_number = (int32_t) ep->X_add_number << (32-shift) >> (32-shift);
1018 upper.X_add_number -= lower.X_add_number;
1019
1020 if (ep->X_op != O_constant)
1021 {
1022 as_bad (_("unsupported large constant"));
1023 return;
1024 }
1025
1026 if (xlen > 32 && !IS_SEXT_32BIT_NUM (ep->X_add_number))
1027 {
1028 /* Reduce to a signed 32-bit constant using SLLI and ADDI. */
1029 while (((upper.X_add_number >> shift) & 1) == 0)
1030 shift++;
1031
1032 upper.X_add_number = (int64_t) upper.X_add_number >> shift;
1033 load_const (reg, &upper);
1034
1035 macro_build (NULL, "slli", "d,s,>", reg, reg, shift);
1036 if (lower.X_add_number != 0)
1037 macro_build (&lower, "addi", "d,s,j", reg, reg, BFD_RELOC_RISCV_LO12_I);
1038 }
1039 else
1040 {
1041 /* Simply emit LUI and/or ADDI to build a 32-bit signed constant. */
1042 int hi_reg = 0;
1043
1044 if (upper.X_add_number != 0)
1045 {
1046 macro_build (ep, "lui", "d,u", reg, BFD_RELOC_RISCV_HI20);
1047 hi_reg = reg;
1048 }
1049
1050 if (lower.X_add_number != 0 || hi_reg == 0)
1051 macro_build (ep, ADD32_INSN, "d,s,j", reg, hi_reg,
1052 BFD_RELOC_RISCV_LO12_I);
1053 }
1054 }
1055
1056 /* Expand RISC-V assembly macros into one or more instructions. */
1057 static void
1058 macro (struct riscv_cl_insn *ip, expressionS *imm_expr,
1059 bfd_reloc_code_real_type *imm_reloc)
1060 {
1061 int rd = (ip->insn_opcode >> OP_SH_RD) & OP_MASK_RD;
1062 int rs1 = (ip->insn_opcode >> OP_SH_RS1) & OP_MASK_RS1;
1063 int rs2 = (ip->insn_opcode >> OP_SH_RS2) & OP_MASK_RS2;
1064 int mask = ip->insn_mo->mask;
1065
1066 switch (mask)
1067 {
1068 case M_LI:
1069 load_const (rd, imm_expr);
1070 break;
1071
1072 case M_LA:
1073 case M_LLA:
1074 /* Load the address of a symbol into a register. */
1075 if (!IS_SEXT_32BIT_NUM (imm_expr->X_add_number))
1076 as_bad (_("offset too large"));
1077
1078 if (imm_expr->X_op == O_constant)
1079 load_const (rd, imm_expr);
1080 else if (riscv_opts.pic && mask == M_LA) /* Global PIC symbol */
1081 pcrel_load (rd, rd, imm_expr, LOAD_ADDRESS_INSN,
1082 BFD_RELOC_RISCV_GOT_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1083 else /* Local PIC symbol, or any non-PIC symbol */
1084 pcrel_load (rd, rd, imm_expr, "addi",
1085 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1086 break;
1087
1088 case M_LA_TLS_GD:
1089 pcrel_load (rd, rd, imm_expr, "addi",
1090 BFD_RELOC_RISCV_TLS_GD_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1091 break;
1092
1093 case M_LA_TLS_IE:
1094 pcrel_load (rd, rd, imm_expr, LOAD_ADDRESS_INSN,
1095 BFD_RELOC_RISCV_TLS_GOT_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1096 break;
1097
1098 case M_LB:
1099 pcrel_load (rd, rd, imm_expr, "lb",
1100 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1101 break;
1102
1103 case M_LBU:
1104 pcrel_load (rd, rd, imm_expr, "lbu",
1105 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1106 break;
1107
1108 case M_LH:
1109 pcrel_load (rd, rd, imm_expr, "lh",
1110 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1111 break;
1112
1113 case M_LHU:
1114 pcrel_load (rd, rd, imm_expr, "lhu",
1115 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1116 break;
1117
1118 case M_LW:
1119 pcrel_load (rd, rd, imm_expr, "lw",
1120 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1121 break;
1122
1123 case M_LWU:
1124 pcrel_load (rd, rd, imm_expr, "lwu",
1125 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1126 break;
1127
1128 case M_LD:
1129 pcrel_load (rd, rd, imm_expr, "ld",
1130 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1131 break;
1132
1133 case M_FLW:
1134 pcrel_load (rd, rs1, imm_expr, "flw",
1135 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1136 break;
1137
1138 case M_FLD:
1139 pcrel_load (rd, rs1, imm_expr, "fld",
1140 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_I);
1141 break;
1142
1143 case M_SB:
1144 pcrel_store (rs2, rs1, imm_expr, "sb",
1145 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_S);
1146 break;
1147
1148 case M_SH:
1149 pcrel_store (rs2, rs1, imm_expr, "sh",
1150 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_S);
1151 break;
1152
1153 case M_SW:
1154 pcrel_store (rs2, rs1, imm_expr, "sw",
1155 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_S);
1156 break;
1157
1158 case M_SD:
1159 pcrel_store (rs2, rs1, imm_expr, "sd",
1160 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_S);
1161 break;
1162
1163 case M_FSW:
1164 pcrel_store (rs2, rs1, imm_expr, "fsw",
1165 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_S);
1166 break;
1167
1168 case M_FSD:
1169 pcrel_store (rs2, rs1, imm_expr, "fsd",
1170 BFD_RELOC_RISCV_PCREL_HI20, BFD_RELOC_RISCV_PCREL_LO12_S);
1171 break;
1172
1173 case M_CALL:
1174 riscv_call (rd, rs1, imm_expr, *imm_reloc);
1175 break;
1176
1177 default:
1178 as_bad (_("Macro %s not implemented"), ip->insn_mo->name);
1179 break;
1180 }
1181 }
1182
1183 static const struct percent_op_match percent_op_utype[] =
1184 {
1185 {"%tprel_hi", BFD_RELOC_RISCV_TPREL_HI20},
1186 {"%pcrel_hi", BFD_RELOC_RISCV_PCREL_HI20},
1187 {"%tls_ie_pcrel_hi", BFD_RELOC_RISCV_TLS_GOT_HI20},
1188 {"%tls_gd_pcrel_hi", BFD_RELOC_RISCV_TLS_GD_HI20},
1189 {"%hi", BFD_RELOC_RISCV_HI20},
1190 {0, 0}
1191 };
1192
1193 static const struct percent_op_match percent_op_itype[] =
1194 {
1195 {"%lo", BFD_RELOC_RISCV_LO12_I},
1196 {"%tprel_lo", BFD_RELOC_RISCV_TPREL_LO12_I},
1197 {"%pcrel_lo", BFD_RELOC_RISCV_PCREL_LO12_I},
1198 {0, 0}
1199 };
1200
1201 static const struct percent_op_match percent_op_stype[] =
1202 {
1203 {"%lo", BFD_RELOC_RISCV_LO12_S},
1204 {"%tprel_lo", BFD_RELOC_RISCV_TPREL_LO12_S},
1205 {"%pcrel_lo", BFD_RELOC_RISCV_PCREL_LO12_S},
1206 {0, 0}
1207 };
1208
1209 static const struct percent_op_match percent_op_rtype[] =
1210 {
1211 {"%tprel_add", BFD_RELOC_RISCV_TPREL_ADD},
1212 {0, 0}
1213 };
1214
1215 static const struct percent_op_match percent_op_null[] =
1216 {
1217 {0, 0}
1218 };
1219
1220 /* Return true if *STR points to a relocation operator. When returning true,
1221 move *STR over the operator and store its relocation code in *RELOC.
1222 Leave both *STR and *RELOC alone when returning false. */
1223
1224 static bfd_boolean
1225 parse_relocation (char **str, bfd_reloc_code_real_type *reloc,
1226 const struct percent_op_match *percent_op)
1227 {
1228 for ( ; percent_op->str; percent_op++)
1229 if (strncasecmp (*str, percent_op->str, strlen (percent_op->str)) == 0)
1230 {
1231 int len = strlen (percent_op->str);
1232
1233 if (!ISSPACE ((*str)[len]) && (*str)[len] != '(')
1234 continue;
1235
1236 *str += strlen (percent_op->str);
1237 *reloc = percent_op->reloc;
1238
1239 /* Check whether the output BFD supports this relocation.
1240 If not, issue an error and fall back on something safe. */
1241 if (*reloc != BFD_RELOC_UNUSED
1242 && !bfd_reloc_type_lookup (stdoutput, *reloc))
1243 {
1244 as_bad ("relocation %s isn't supported by the current ABI",
1245 percent_op->str);
1246 *reloc = BFD_RELOC_UNUSED;
1247 }
1248 return TRUE;
1249 }
1250 return FALSE;
1251 }
1252
1253 static void
1254 my_getExpression (expressionS *ep, char *str)
1255 {
1256 char *save_in;
1257
1258 save_in = input_line_pointer;
1259 input_line_pointer = str;
1260 expression (ep);
1261 expr_end = input_line_pointer;
1262 input_line_pointer = save_in;
1263 }
1264
1265 /* Parse string STR as a 16-bit relocatable operand. Store the
1266 expression in *EP and the relocation, if any, in RELOC.
1267 Return the number of relocation operators used (0 or 1).
1268
1269 On exit, EXPR_END points to the first character after the expression. */
1270
1271 static size_t
1272 my_getSmallExpression (expressionS *ep, bfd_reloc_code_real_type *reloc,
1273 char *str, const struct percent_op_match *percent_op)
1274 {
1275 size_t reloc_index;
1276 unsigned crux_depth, str_depth, regno;
1277 char *crux;
1278
1279 /* First, check for integer registers. No callers can accept a reg, but
1280 we need to avoid accidentally creating a useless undefined symbol below,
1281 if this is an instruction pattern that can't match. A glibc build fails
1282 if this is removed. */
1283 if (reg_lookup (&str, RCLASS_GPR, &regno))
1284 {
1285 ep->X_op = O_register;
1286 ep->X_add_number = regno;
1287 expr_end = str;
1288 return 0;
1289 }
1290
1291 /* Search for the start of the main expression.
1292 End the loop with CRUX pointing to the start
1293 of the main expression and with CRUX_DEPTH containing the number
1294 of open brackets at that point. */
1295 reloc_index = -1;
1296 str_depth = 0;
1297 do
1298 {
1299 reloc_index++;
1300 crux = str;
1301 crux_depth = str_depth;
1302
1303 /* Skip over whitespace and brackets, keeping count of the number
1304 of brackets. */
1305 while (*str == ' ' || *str == '\t' || *str == '(')
1306 if (*str++ == '(')
1307 str_depth++;
1308 }
1309 while (*str == '%'
1310 && reloc_index < 1
1311 && parse_relocation (&str, reloc, percent_op));
1312
1313 my_getExpression (ep, crux);
1314 str = expr_end;
1315
1316 /* Match every open bracket. */
1317 while (crux_depth > 0 && (*str == ')' || *str == ' ' || *str == '\t'))
1318 if (*str++ == ')')
1319 crux_depth--;
1320
1321 if (crux_depth > 0)
1322 as_bad ("unclosed '('");
1323
1324 expr_end = str;
1325
1326 return reloc_index;
1327 }
1328
1329 /* Parse opcode name, could be an mnemonics or number. */
1330 static size_t
1331 my_getOpcodeExpression (expressionS *ep, bfd_reloc_code_real_type *reloc,
1332 char *str, const struct percent_op_match *percent_op)
1333 {
1334 const struct opcode_name_t *o = opcode_name_lookup (&str);
1335
1336 if (o != NULL)
1337 {
1338 ep->X_op = O_constant;
1339 ep->X_add_number = o->val;
1340 return 0;
1341 }
1342
1343 return my_getSmallExpression (ep, reloc, str, percent_op);
1344 }
1345
1346 /* Detect and handle implicitly zero load-store offsets. For example,
1347 "lw t0, (t1)" is shorthand for "lw t0, 0(t1)". Return TRUE iff such
1348 an implicit offset was detected. */
1349
1350 static bfd_boolean
1351 riscv_handle_implicit_zero_offset (expressionS *ep, const char *s)
1352 {
1353 /* Check whether there is only a single bracketed expression left.
1354 If so, it must be the base register and the constant must be zero. */
1355 if (*s == '(' && strchr (s + 1, '(') == 0)
1356 {
1357 ep->X_op = O_constant;
1358 ep->X_add_number = 0;
1359 return TRUE;
1360 }
1361
1362 return FALSE;
1363 }
1364
1365 /* This routine assembles an instruction into its binary format. As a
1366 side effect, it sets the global variable imm_reloc to the type of
1367 relocation to do if one of the operands is an address expression. */
1368
1369 static const char *
1370 riscv_ip (char *str, struct riscv_cl_insn *ip, expressionS *imm_expr,
1371 bfd_reloc_code_real_type *imm_reloc, struct hash_control *hash)
1372 {
1373 char *s;
1374 const char *args;
1375 char c = 0;
1376 struct riscv_opcode *insn;
1377 char *argsStart;
1378 unsigned int regno;
1379 char save_c = 0;
1380 int argnum;
1381 const struct percent_op_match *p;
1382 const char *error = "unrecognized opcode";
1383
1384 /* Parse the name of the instruction. Terminate the string if whitespace
1385 is found so that hash_find only sees the name part of the string. */
1386 for (s = str; *s != '\0'; ++s)
1387 if (ISSPACE (*s))
1388 {
1389 save_c = *s;
1390 *s++ = '\0';
1391 break;
1392 }
1393
1394 insn = (struct riscv_opcode *) hash_find (hash, str);
1395
1396 argsStart = s;
1397 for ( ; insn && insn->name && strcmp (insn->name, str) == 0; insn++)
1398 {
1399 if ((insn->xlen_requirement != 0) && (xlen != insn->xlen_requirement))
1400 continue;
1401
1402 if (!riscv_multi_subset_supports (insn->subset))
1403 continue;
1404
1405 create_insn (ip, insn);
1406 argnum = 1;
1407
1408 imm_expr->X_op = O_absent;
1409 *imm_reloc = BFD_RELOC_UNUSED;
1410 p = percent_op_itype;
1411
1412 for (args = insn->args;; ++args)
1413 {
1414 s += strspn (s, " \t");
1415 switch (*args)
1416 {
1417 case '\0': /* End of args. */
1418 if (insn->pinfo != INSN_MACRO)
1419 {
1420 if (!insn->match_func (insn, ip->insn_opcode))
1421 break;
1422
1423 /* For .insn, insn->match and insn->mask are 0. */
1424 if (riscv_insn_length ((insn->match == 0 && insn->mask == 0)
1425 ? ip->insn_opcode
1426 : insn->match) == 2
1427 && !riscv_opts.rvc)
1428 break;
1429 }
1430 if (*s != '\0')
1431 break;
1432 /* Successful assembly. */
1433 error = NULL;
1434 goto out;
1435
1436 case 'C': /* RVC */
1437 switch (*++args)
1438 {
1439 case 's': /* RS1 x8-x15 */
1440 if (!reg_lookup (&s, RCLASS_GPR, &regno)
1441 || !(regno >= 8 && regno <= 15))
1442 break;
1443 INSERT_OPERAND (CRS1S, *ip, regno % 8);
1444 continue;
1445 case 'w': /* RS1 x8-x15, constrained to equal RD x8-x15. */
1446 if (!reg_lookup (&s, RCLASS_GPR, &regno)
1447 || EXTRACT_OPERAND (CRS1S, ip->insn_opcode) + 8 != regno)
1448 break;
1449 continue;
1450 case 't': /* RS2 x8-x15 */
1451 if (!reg_lookup (&s, RCLASS_GPR, &regno)
1452 || !(regno >= 8 && regno <= 15))
1453 break;
1454 INSERT_OPERAND (CRS2S, *ip, regno % 8);
1455 continue;
1456 case 'x': /* RS2 x8-x15, constrained to equal RD x8-x15. */
1457 if (!reg_lookup (&s, RCLASS_GPR, &regno)
1458 || EXTRACT_OPERAND (CRS2S, ip->insn_opcode) + 8 != regno)
1459 break;
1460 continue;
1461 case 'U': /* RS1, constrained to equal RD. */
1462 if (!reg_lookup (&s, RCLASS_GPR, &regno)
1463 || EXTRACT_OPERAND (RD, ip->insn_opcode) != regno)
1464 break;
1465 continue;
1466 case 'V': /* RS2 */
1467 if (!reg_lookup (&s, RCLASS_GPR, &regno))
1468 break;
1469 INSERT_OPERAND (CRS2, *ip, regno);
1470 continue;
1471 case 'c': /* RS1, constrained to equal sp. */
1472 if (!reg_lookup (&s, RCLASS_GPR, &regno)
1473 || regno != X_SP)
1474 break;
1475 continue;
1476 case 'z': /* RS2, contrained to equal x0. */
1477 if (!reg_lookup (&s, RCLASS_GPR, &regno)
1478 || regno != 0)
1479 break;
1480 continue;
1481 case '>':
1482 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1483 || imm_expr->X_op != O_constant
1484 || imm_expr->X_add_number <= 0
1485 || imm_expr->X_add_number >= 64)
1486 break;
1487 ip->insn_opcode |= ENCODE_RVC_IMM (imm_expr->X_add_number);
1488 rvc_imm_done:
1489 s = expr_end;
1490 imm_expr->X_op = O_absent;
1491 continue;
1492 case '<':
1493 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1494 || imm_expr->X_op != O_constant
1495 || !VALID_RVC_IMM (imm_expr->X_add_number)
1496 || imm_expr->X_add_number <= 0
1497 || imm_expr->X_add_number >= 32)
1498 break;
1499 ip->insn_opcode |= ENCODE_RVC_IMM (imm_expr->X_add_number);
1500 goto rvc_imm_done;
1501 case '8':
1502 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1503 || imm_expr->X_op != O_constant
1504 || !VALID_RVC_UIMM8 (imm_expr->X_add_number)
1505 || imm_expr->X_add_number < 0
1506 || imm_expr->X_add_number >= 256)
1507 break;
1508 ip->insn_opcode |= ENCODE_RVC_UIMM8 (imm_expr->X_add_number);
1509 goto rvc_imm_done;
1510 case 'i':
1511 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1512 || imm_expr->X_op != O_constant
1513 || imm_expr->X_add_number == 0
1514 || !VALID_RVC_SIMM3 (imm_expr->X_add_number))
1515 break;
1516 ip->insn_opcode |= ENCODE_RVC_SIMM3 (imm_expr->X_add_number);
1517 goto rvc_imm_done;
1518 case 'j':
1519 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1520 || imm_expr->X_op != O_constant
1521 || imm_expr->X_add_number == 0
1522 || !VALID_RVC_IMM (imm_expr->X_add_number))
1523 break;
1524 ip->insn_opcode |= ENCODE_RVC_IMM (imm_expr->X_add_number);
1525 goto rvc_imm_done;
1526 case 'k':
1527 if (riscv_handle_implicit_zero_offset (imm_expr, s))
1528 continue;
1529 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1530 || imm_expr->X_op != O_constant
1531 || !VALID_RVC_LW_IMM (imm_expr->X_add_number))
1532 break;
1533 ip->insn_opcode |= ENCODE_RVC_LW_IMM (imm_expr->X_add_number);
1534 goto rvc_imm_done;
1535 case 'l':
1536 if (riscv_handle_implicit_zero_offset (imm_expr, s))
1537 continue;
1538 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1539 || imm_expr->X_op != O_constant
1540 || !VALID_RVC_LD_IMM (imm_expr->X_add_number))
1541 break;
1542 ip->insn_opcode |= ENCODE_RVC_LD_IMM (imm_expr->X_add_number);
1543 goto rvc_imm_done;
1544 case 'm':
1545 if (riscv_handle_implicit_zero_offset (imm_expr, s))
1546 continue;
1547 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1548 || imm_expr->X_op != O_constant
1549 || !VALID_RVC_LWSP_IMM (imm_expr->X_add_number))
1550 break;
1551 ip->insn_opcode |=
1552 ENCODE_RVC_LWSP_IMM (imm_expr->X_add_number);
1553 goto rvc_imm_done;
1554 case 'n':
1555 if (riscv_handle_implicit_zero_offset (imm_expr, s))
1556 continue;
1557 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1558 || imm_expr->X_op != O_constant
1559 || !VALID_RVC_LDSP_IMM (imm_expr->X_add_number))
1560 break;
1561 ip->insn_opcode |=
1562 ENCODE_RVC_LDSP_IMM (imm_expr->X_add_number);
1563 goto rvc_imm_done;
1564 case 'o':
1565 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1566 || imm_expr->X_op != O_constant
1567 /* C.addiw, c.li, and c.andi allow zero immediate.
1568 C.addi allows zero immediate as hint. Otherwise this
1569 is same as 'j'. */
1570 || !VALID_RVC_IMM (imm_expr->X_add_number))
1571 break;
1572 ip->insn_opcode |= ENCODE_RVC_IMM (imm_expr->X_add_number);
1573 goto rvc_imm_done;
1574 case 'K':
1575 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1576 || imm_expr->X_op != O_constant
1577 || !VALID_RVC_ADDI4SPN_IMM (imm_expr->X_add_number)
1578 || imm_expr->X_add_number == 0)
1579 break;
1580 ip->insn_opcode |=
1581 ENCODE_RVC_ADDI4SPN_IMM (imm_expr->X_add_number);
1582 goto rvc_imm_done;
1583 case 'L':
1584 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1585 || imm_expr->X_op != O_constant
1586 || !VALID_RVC_ADDI16SP_IMM (imm_expr->X_add_number)
1587 || imm_expr->X_add_number == 0)
1588 break;
1589 ip->insn_opcode |=
1590 ENCODE_RVC_ADDI16SP_IMM (imm_expr->X_add_number);
1591 goto rvc_imm_done;
1592 case 'M':
1593 if (riscv_handle_implicit_zero_offset (imm_expr, s))
1594 continue;
1595 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1596 || imm_expr->X_op != O_constant
1597 || !VALID_RVC_SWSP_IMM (imm_expr->X_add_number))
1598 break;
1599 ip->insn_opcode |=
1600 ENCODE_RVC_SWSP_IMM (imm_expr->X_add_number);
1601 goto rvc_imm_done;
1602 case 'N':
1603 if (riscv_handle_implicit_zero_offset (imm_expr, s))
1604 continue;
1605 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1606 || imm_expr->X_op != O_constant
1607 || !VALID_RVC_SDSP_IMM (imm_expr->X_add_number))
1608 break;
1609 ip->insn_opcode |=
1610 ENCODE_RVC_SDSP_IMM (imm_expr->X_add_number);
1611 goto rvc_imm_done;
1612 case 'u':
1613 p = percent_op_utype;
1614 if (my_getSmallExpression (imm_expr, imm_reloc, s, p))
1615 break;
1616 rvc_lui:
1617 if (imm_expr->X_op != O_constant
1618 || imm_expr->X_add_number <= 0
1619 || imm_expr->X_add_number >= RISCV_BIGIMM_REACH
1620 || (imm_expr->X_add_number >= RISCV_RVC_IMM_REACH / 2
1621 && (imm_expr->X_add_number <
1622 RISCV_BIGIMM_REACH - RISCV_RVC_IMM_REACH / 2)))
1623 break;
1624 ip->insn_opcode |= ENCODE_RVC_IMM (imm_expr->X_add_number);
1625 goto rvc_imm_done;
1626 case 'v':
1627 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1628 || (imm_expr->X_add_number & (RISCV_IMM_REACH - 1))
1629 || ((int32_t)imm_expr->X_add_number
1630 != imm_expr->X_add_number))
1631 break;
1632 imm_expr->X_add_number =
1633 ((uint32_t) imm_expr->X_add_number) >> RISCV_IMM_BITS;
1634 goto rvc_lui;
1635 case 'p':
1636 goto branch;
1637 case 'a':
1638 goto jump;
1639 case 'S': /* Floating-point RS1 x8-x15. */
1640 if (!reg_lookup (&s, RCLASS_FPR, &regno)
1641 || !(regno >= 8 && regno <= 15))
1642 break;
1643 INSERT_OPERAND (CRS1S, *ip, regno % 8);
1644 continue;
1645 case 'D': /* Floating-point RS2 x8-x15. */
1646 if (!reg_lookup (&s, RCLASS_FPR, &regno)
1647 || !(regno >= 8 && regno <= 15))
1648 break;
1649 INSERT_OPERAND (CRS2S, *ip, regno % 8);
1650 continue;
1651 case 'T': /* Floating-point RS2. */
1652 if (!reg_lookup (&s, RCLASS_FPR, &regno))
1653 break;
1654 INSERT_OPERAND (CRS2, *ip, regno);
1655 continue;
1656 case 'F':
1657 switch (*++args)
1658 {
1659 case '6':
1660 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1661 || imm_expr->X_op != O_constant
1662 || imm_expr->X_add_number < 0
1663 || imm_expr->X_add_number >= 64)
1664 {
1665 as_bad (_("bad value for funct6 field, "
1666 "value must be 0...64"));
1667 break;
1668 }
1669
1670 INSERT_OPERAND (CFUNCT6, *ip, imm_expr->X_add_number);
1671 imm_expr->X_op = O_absent;
1672 s = expr_end;
1673 continue;
1674 case '4':
1675 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1676 || imm_expr->X_op != O_constant
1677 || imm_expr->X_add_number < 0
1678 || imm_expr->X_add_number >= 16)
1679 {
1680 as_bad (_("bad value for funct4 field, "
1681 "value must be 0...15"));
1682 break;
1683 }
1684
1685 INSERT_OPERAND (CFUNCT4, *ip, imm_expr->X_add_number);
1686 imm_expr->X_op = O_absent;
1687 s = expr_end;
1688 continue;
1689 case '3':
1690 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1691 || imm_expr->X_op != O_constant
1692 || imm_expr->X_add_number < 0
1693 || imm_expr->X_add_number >= 8)
1694 {
1695 as_bad (_("bad value for funct3 field, "
1696 "value must be 0...7"));
1697 break;
1698 }
1699 INSERT_OPERAND (CFUNCT3, *ip, imm_expr->X_add_number);
1700 imm_expr->X_op = O_absent;
1701 s = expr_end;
1702 continue;
1703 case '2':
1704 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
1705 || imm_expr->X_op != O_constant
1706 || imm_expr->X_add_number < 0
1707 || imm_expr->X_add_number >= 4)
1708 {
1709 as_bad (_("bad value for funct2 field, "
1710 "value must be 0...3"));
1711 break;
1712 }
1713 INSERT_OPERAND (CFUNCT2, *ip, imm_expr->X_add_number);
1714 imm_expr->X_op = O_absent;
1715 s = expr_end;
1716 continue;
1717 default:
1718 as_bad (_("bad compressed FUNCT field"
1719 " specifier 'CF%c'\n"),
1720 *args);
1721 }
1722 break;
1723
1724 default:
1725 as_bad (_("bad RVC field specifier 'C%c'\n"), *args);
1726 }
1727 break;
1728
1729 case ',':
1730 ++argnum;
1731 if (*s++ == *args)
1732 continue;
1733 s--;
1734 break;
1735
1736 case '(':
1737 case ')':
1738 case '[':
1739 case ']':
1740 if (*s++ == *args)
1741 continue;
1742 break;
1743
1744 case '<': /* Shift amount, 0 - 31. */
1745 my_getExpression (imm_expr, s);
1746 check_absolute_expr (ip, imm_expr, FALSE);
1747 if ((unsigned long) imm_expr->X_add_number > 31)
1748 as_bad (_("Improper shift amount (%lu)"),
1749 (unsigned long) imm_expr->X_add_number);
1750 INSERT_OPERAND (SHAMTW, *ip, imm_expr->X_add_number);
1751 imm_expr->X_op = O_absent;
1752 s = expr_end;
1753 continue;
1754
1755 case '>': /* Shift amount, 0 - (XLEN-1). */
1756 my_getExpression (imm_expr, s);
1757 check_absolute_expr (ip, imm_expr, FALSE);
1758 if ((unsigned long) imm_expr->X_add_number >= xlen)
1759 as_bad (_("Improper shift amount (%lu)"),
1760 (unsigned long) imm_expr->X_add_number);
1761 INSERT_OPERAND (SHAMT, *ip, imm_expr->X_add_number);
1762 imm_expr->X_op = O_absent;
1763 s = expr_end;
1764 continue;
1765
1766 case 'Z': /* CSRRxI immediate. */
1767 my_getExpression (imm_expr, s);
1768 check_absolute_expr (ip, imm_expr, FALSE);
1769 if ((unsigned long) imm_expr->X_add_number > 31)
1770 as_bad (_("Improper CSRxI immediate (%lu)"),
1771 (unsigned long) imm_expr->X_add_number);
1772 INSERT_OPERAND (RS1, *ip, imm_expr->X_add_number);
1773 imm_expr->X_op = O_absent;
1774 s = expr_end;
1775 continue;
1776
1777 case 'E': /* Control register. */
1778 if (reg_lookup (&s, RCLASS_CSR, &regno))
1779 INSERT_OPERAND (CSR, *ip, regno);
1780 else
1781 {
1782 my_getExpression (imm_expr, s);
1783 check_absolute_expr (ip, imm_expr, TRUE);
1784 if ((unsigned long) imm_expr->X_add_number > 0xfff)
1785 as_bad (_("Improper CSR address (%lu)"),
1786 (unsigned long) imm_expr->X_add_number);
1787 INSERT_OPERAND (CSR, *ip, imm_expr->X_add_number);
1788 imm_expr->X_op = O_absent;
1789 s = expr_end;
1790 }
1791 continue;
1792
1793 case 'm': /* Rounding mode. */
1794 if (arg_lookup (&s, riscv_rm, ARRAY_SIZE (riscv_rm), &regno))
1795 {
1796 INSERT_OPERAND (RM, *ip, regno);
1797 continue;
1798 }
1799 break;
1800
1801 case 'P':
1802 case 'Q': /* Fence predecessor/successor. */
1803 if (arg_lookup (&s, riscv_pred_succ, ARRAY_SIZE (riscv_pred_succ),
1804 &regno))
1805 {
1806 if (*args == 'P')
1807 INSERT_OPERAND (PRED, *ip, regno);
1808 else
1809 INSERT_OPERAND (SUCC, *ip, regno);
1810 continue;
1811 }
1812 break;
1813
1814 case 'd': /* Destination register. */
1815 case 's': /* Source register. */
1816 case 't': /* Target register. */
1817 case 'r': /* rs3. */
1818 if (reg_lookup (&s, RCLASS_GPR, &regno))
1819 {
1820 c = *args;
1821 if (*s == ' ')
1822 ++s;
1823
1824 /* Now that we have assembled one operand, we use the args
1825 string to figure out where it goes in the instruction. */
1826 switch (c)
1827 {
1828 case 's':
1829 INSERT_OPERAND (RS1, *ip, regno);
1830 break;
1831 case 'd':
1832 INSERT_OPERAND (RD, *ip, regno);
1833 break;
1834 case 't':
1835 INSERT_OPERAND (RS2, *ip, regno);
1836 break;
1837 case 'r':
1838 INSERT_OPERAND (RS3, *ip, regno);
1839 break;
1840 }
1841 continue;
1842 }
1843 break;
1844
1845 case 'D': /* Floating point rd. */
1846 case 'S': /* Floating point rs1. */
1847 case 'T': /* Floating point rs2. */
1848 case 'U': /* Floating point rs1 and rs2. */
1849 case 'R': /* Floating point rs3. */
1850 if (reg_lookup (&s, RCLASS_FPR, &regno))
1851 {
1852 c = *args;
1853 if (*s == ' ')
1854 ++s;
1855 switch (c)
1856 {
1857 case 'D':
1858 INSERT_OPERAND (RD, *ip, regno);
1859 break;
1860 case 'S':
1861 INSERT_OPERAND (RS1, *ip, regno);
1862 break;
1863 case 'U':
1864 INSERT_OPERAND (RS1, *ip, regno);
1865 /* fallthru */
1866 case 'T':
1867 INSERT_OPERAND (RS2, *ip, regno);
1868 break;
1869 case 'R':
1870 INSERT_OPERAND (RS3, *ip, regno);
1871 break;
1872 }
1873 continue;
1874 }
1875
1876 break;
1877
1878 case 'I':
1879 my_getExpression (imm_expr, s);
1880 if (imm_expr->X_op != O_big
1881 && imm_expr->X_op != O_constant)
1882 break;
1883 normalize_constant_expr (imm_expr);
1884 s = expr_end;
1885 continue;
1886
1887 case 'A':
1888 my_getExpression (imm_expr, s);
1889 normalize_constant_expr (imm_expr);
1890 /* The 'A' format specifier must be a symbol. */
1891 if (imm_expr->X_op != O_symbol)
1892 break;
1893 *imm_reloc = BFD_RELOC_32;
1894 s = expr_end;
1895 continue;
1896
1897 case 'B':
1898 my_getExpression (imm_expr, s);
1899 normalize_constant_expr (imm_expr);
1900 /* The 'B' format specifier must be a symbol or a constant. */
1901 if (imm_expr->X_op != O_symbol && imm_expr->X_op != O_constant)
1902 break;
1903 if (imm_expr->X_op == O_symbol)
1904 *imm_reloc = BFD_RELOC_32;
1905 s = expr_end;
1906 continue;
1907
1908 case 'j': /* Sign-extended immediate. */
1909 p = percent_op_itype;
1910 *imm_reloc = BFD_RELOC_RISCV_LO12_I;
1911 goto alu_op;
1912 case 'q': /* Store displacement. */
1913 p = percent_op_stype;
1914 *imm_reloc = BFD_RELOC_RISCV_LO12_S;
1915 goto load_store;
1916 case 'o': /* Load displacement. */
1917 p = percent_op_itype;
1918 *imm_reloc = BFD_RELOC_RISCV_LO12_I;
1919 goto load_store;
1920 case '1': /* 4-operand add, must be %tprel_add. */
1921 p = percent_op_rtype;
1922 goto alu_op;
1923 case '0': /* AMO "displacement," which must be zero. */
1924 p = percent_op_null;
1925 load_store:
1926 if (riscv_handle_implicit_zero_offset (imm_expr, s))
1927 continue;
1928 alu_op:
1929 /* If this value won't fit into a 16 bit offset, then go
1930 find a macro that will generate the 32 bit offset
1931 code pattern. */
1932 if (!my_getSmallExpression (imm_expr, imm_reloc, s, p))
1933 {
1934 normalize_constant_expr (imm_expr);
1935 if (imm_expr->X_op != O_constant
1936 || (*args == '0' && imm_expr->X_add_number != 0)
1937 || (*args == '1')
1938 || imm_expr->X_add_number >= (signed)RISCV_IMM_REACH/2
1939 || imm_expr->X_add_number < -(signed)RISCV_IMM_REACH/2)
1940 break;
1941 }
1942
1943 s = expr_end;
1944 continue;
1945
1946 case 'p': /* PC-relative offset. */
1947 branch:
1948 *imm_reloc = BFD_RELOC_12_PCREL;
1949 my_getExpression (imm_expr, s);
1950 s = expr_end;
1951 continue;
1952
1953 case 'u': /* Upper 20 bits. */
1954 p = percent_op_utype;
1955 if (!my_getSmallExpression (imm_expr, imm_reloc, s, p)
1956 && imm_expr->X_op == O_constant)
1957 {
1958 if (imm_expr->X_add_number < 0
1959 || imm_expr->X_add_number >= (signed)RISCV_BIGIMM_REACH)
1960 as_bad (_("lui expression not in range 0..1048575"));
1961
1962 *imm_reloc = BFD_RELOC_RISCV_HI20;
1963 imm_expr->X_add_number <<= RISCV_IMM_BITS;
1964 }
1965 /* The 'u' format specifier must be a symbol or a constant. */
1966 if (imm_expr->X_op != O_symbol && imm_expr->X_op != O_constant)
1967 break;
1968 s = expr_end;
1969 continue;
1970
1971 case 'a': /* 20-bit PC-relative offset. */
1972 jump:
1973 my_getExpression (imm_expr, s);
1974 s = expr_end;
1975 *imm_reloc = BFD_RELOC_RISCV_JMP;
1976 continue;
1977
1978 case 'c':
1979 my_getExpression (imm_expr, s);
1980 s = expr_end;
1981 if (strcmp (s, "@plt") == 0)
1982 {
1983 *imm_reloc = BFD_RELOC_RISCV_CALL_PLT;
1984 s += 4;
1985 }
1986 else
1987 *imm_reloc = BFD_RELOC_RISCV_CALL;
1988 continue;
1989 case 'O':
1990 switch (*++args)
1991 {
1992 case '4':
1993 if (my_getOpcodeExpression (imm_expr, imm_reloc, s, p)
1994 || imm_expr->X_op != O_constant
1995 || imm_expr->X_add_number < 0
1996 || imm_expr->X_add_number >= 128
1997 || (imm_expr->X_add_number & 0x3) != 3)
1998 {
1999 as_bad (_("bad value for opcode field, "
2000 "value must be 0...127 and "
2001 "lower 2 bits must be 0x3"));
2002 break;
2003 }
2004
2005 INSERT_OPERAND (OP, *ip, imm_expr->X_add_number);
2006 imm_expr->X_op = O_absent;
2007 s = expr_end;
2008 continue;
2009 case '2':
2010 if (my_getOpcodeExpression (imm_expr, imm_reloc, s, p)
2011 || imm_expr->X_op != O_constant
2012 || imm_expr->X_add_number < 0
2013 || imm_expr->X_add_number >= 3)
2014 {
2015 as_bad (_("bad value for opcode field, "
2016 "value must be 0...2"));
2017 break;
2018 }
2019
2020 INSERT_OPERAND (OP2, *ip, imm_expr->X_add_number);
2021 imm_expr->X_op = O_absent;
2022 s = expr_end;
2023 continue;
2024 default:
2025 as_bad (_("bad Opcode field specifier 'O%c'\n"), *args);
2026 }
2027 break;
2028
2029 case 'F':
2030 switch (*++args)
2031 {
2032 case '7':
2033 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
2034 || imm_expr->X_op != O_constant
2035 || imm_expr->X_add_number < 0
2036 || imm_expr->X_add_number >= 128)
2037 {
2038 as_bad (_("bad value for funct7 field, "
2039 "value must be 0...127"));
2040 break;
2041 }
2042
2043 INSERT_OPERAND (FUNCT7, *ip, imm_expr->X_add_number);
2044 imm_expr->X_op = O_absent;
2045 s = expr_end;
2046 continue;
2047 case '3':
2048 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
2049 || imm_expr->X_op != O_constant
2050 || imm_expr->X_add_number < 0
2051 || imm_expr->X_add_number >= 8)
2052 {
2053 as_bad (_("bad value for funct3 field, "
2054 "value must be 0...7"));
2055 break;
2056 }
2057
2058 INSERT_OPERAND (FUNCT3, *ip, imm_expr->X_add_number);
2059 imm_expr->X_op = O_absent;
2060 s = expr_end;
2061 continue;
2062 case '2':
2063 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
2064 || imm_expr->X_op != O_constant
2065 || imm_expr->X_add_number < 0
2066 || imm_expr->X_add_number >= 4)
2067 {
2068 as_bad (_("bad value for funct2 field, "
2069 "value must be 0...3"));
2070 break;
2071 }
2072
2073 INSERT_OPERAND (FUNCT2, *ip, imm_expr->X_add_number);
2074 imm_expr->X_op = O_absent;
2075 s = expr_end;
2076 continue;
2077
2078 default:
2079 as_bad (_("bad FUNCT field specifier 'F%c'\n"), *args);
2080 }
2081 break;
2082
2083 case 'z':
2084 if (my_getSmallExpression (imm_expr, imm_reloc, s, p)
2085 || imm_expr->X_op != O_constant
2086 || imm_expr->X_add_number != 0)
2087 break;
2088 s = expr_end;
2089 imm_expr->X_op = O_absent;
2090 continue;
2091
2092 default:
2093 as_fatal (_("internal error: bad argument type %c"), *args);
2094 }
2095 break;
2096 }
2097 s = argsStart;
2098 error = _("illegal operands");
2099 }
2100
2101 out:
2102 /* Restore the character we might have clobbered above. */
2103 if (save_c)
2104 *(argsStart - 1) = save_c;
2105
2106 return error;
2107 }
2108
2109 void
2110 md_assemble (char *str)
2111 {
2112 struct riscv_cl_insn insn;
2113 expressionS imm_expr;
2114 bfd_reloc_code_real_type imm_reloc = BFD_RELOC_UNUSED;
2115
2116 const char *error = riscv_ip (str, &insn, &imm_expr, &imm_reloc, op_hash);
2117
2118 start_assemble = TRUE;
2119
2120 if (error)
2121 {
2122 as_bad ("%s `%s'", error, str);
2123 return;
2124 }
2125
2126 if (insn.insn_mo->pinfo == INSN_MACRO)
2127 macro (&insn, &imm_expr, &imm_reloc);
2128 else
2129 append_insn (&insn, &imm_expr, imm_reloc);
2130 }
2131
2132 const char *
2133 md_atof (int type, char *litP, int *sizeP)
2134 {
2135 return ieee_md_atof (type, litP, sizeP, TARGET_BYTES_BIG_ENDIAN);
2136 }
2137
2138 void
2139 md_number_to_chars (char *buf, valueT val, int n)
2140 {
2141 number_to_chars_littleendian (buf, val, n);
2142 }
2143
2144 const char *md_shortopts = "O::g::G:";
2145
2146 enum options
2147 {
2148 OPTION_MARCH = OPTION_MD_BASE,
2149 OPTION_PIC,
2150 OPTION_NO_PIC,
2151 OPTION_MABI,
2152 OPTION_RELAX,
2153 OPTION_NO_RELAX,
2154 OPTION_ARCH_ATTR,
2155 OPTION_NO_ARCH_ATTR,
2156 OPTION_END_OF_ENUM
2157 };
2158
2159 struct option md_longopts[] =
2160 {
2161 {"march", required_argument, NULL, OPTION_MARCH},
2162 {"fPIC", no_argument, NULL, OPTION_PIC},
2163 {"fpic", no_argument, NULL, OPTION_PIC},
2164 {"fno-pic", no_argument, NULL, OPTION_NO_PIC},
2165 {"mabi", required_argument, NULL, OPTION_MABI},
2166 {"mrelax", no_argument, NULL, OPTION_RELAX},
2167 {"mno-relax", no_argument, NULL, OPTION_NO_RELAX},
2168 {"march-attr", no_argument, NULL, OPTION_ARCH_ATTR},
2169 {"mno-arch-attr", no_argument, NULL, OPTION_NO_ARCH_ATTR},
2170
2171 {NULL, no_argument, NULL, 0}
2172 };
2173 size_t md_longopts_size = sizeof (md_longopts);
2174
2175 enum float_abi {
2176 FLOAT_ABI_DEFAULT = -1,
2177 FLOAT_ABI_SOFT,
2178 FLOAT_ABI_SINGLE,
2179 FLOAT_ABI_DOUBLE,
2180 FLOAT_ABI_QUAD
2181 };
2182 static enum float_abi float_abi = FLOAT_ABI_DEFAULT;
2183
2184 static void
2185 riscv_set_abi (unsigned new_xlen, enum float_abi new_float_abi, bfd_boolean rve)
2186 {
2187 abi_xlen = new_xlen;
2188 float_abi = new_float_abi;
2189 rve_abi = rve;
2190 }
2191
2192 int
2193 md_parse_option (int c, const char *arg)
2194 {
2195 switch (c)
2196 {
2197 case OPTION_MARCH:
2198 riscv_set_arch (arg);
2199 break;
2200
2201 case OPTION_NO_PIC:
2202 riscv_opts.pic = FALSE;
2203 break;
2204
2205 case OPTION_PIC:
2206 riscv_opts.pic = TRUE;
2207 break;
2208
2209 case OPTION_MABI:
2210 if (strcmp (arg, "ilp32") == 0)
2211 riscv_set_abi (32, FLOAT_ABI_SOFT, FALSE);
2212 else if (strcmp (arg, "ilp32e") == 0)
2213 riscv_set_abi (32, FLOAT_ABI_SOFT, TRUE);
2214 else if (strcmp (arg, "ilp32f") == 0)
2215 riscv_set_abi (32, FLOAT_ABI_SINGLE, FALSE);
2216 else if (strcmp (arg, "ilp32d") == 0)
2217 riscv_set_abi (32, FLOAT_ABI_DOUBLE, FALSE);
2218 else if (strcmp (arg, "ilp32q") == 0)
2219 riscv_set_abi (32, FLOAT_ABI_QUAD, FALSE);
2220 else if (strcmp (arg, "lp64") == 0)
2221 riscv_set_abi (64, FLOAT_ABI_SOFT, FALSE);
2222 else if (strcmp (arg, "lp64f") == 0)
2223 riscv_set_abi (64, FLOAT_ABI_SINGLE, FALSE);
2224 else if (strcmp (arg, "lp64d") == 0)
2225 riscv_set_abi (64, FLOAT_ABI_DOUBLE, FALSE);
2226 else if (strcmp (arg, "lp64q") == 0)
2227 riscv_set_abi (64, FLOAT_ABI_QUAD, FALSE);
2228 else
2229 return 0;
2230 break;
2231
2232 case OPTION_RELAX:
2233 riscv_opts.relax = TRUE;
2234 break;
2235
2236 case OPTION_NO_RELAX:
2237 riscv_opts.relax = FALSE;
2238 break;
2239
2240 case OPTION_ARCH_ATTR:
2241 riscv_opts.arch_attr = TRUE;
2242 break;
2243
2244 case OPTION_NO_ARCH_ATTR:
2245 riscv_opts.arch_attr = FALSE;
2246 break;
2247
2248 default:
2249 return 0;
2250 }
2251
2252 return 1;
2253 }
2254
2255 void
2256 riscv_after_parse_args (void)
2257 {
2258 if (xlen == 0)
2259 {
2260 if (strcmp (default_arch, "riscv32") == 0)
2261 xlen = 32;
2262 else if (strcmp (default_arch, "riscv64") == 0)
2263 xlen = 64;
2264 else
2265 as_bad ("unknown default architecture `%s'", default_arch);
2266 }
2267
2268 if (riscv_subsets.head == NULL)
2269 riscv_set_arch (xlen == 64 ? "rv64g" : "rv32g");
2270
2271 /* Add the RVC extension, regardless of -march, to support .option rvc. */
2272 riscv_set_rvc (FALSE);
2273 if (riscv_subset_supports ("c"))
2274 riscv_set_rvc (TRUE);
2275
2276 /* Enable RVE if specified by the -march option. */
2277 riscv_set_rve (FALSE);
2278 if (riscv_subset_supports ("e"))
2279 riscv_set_rve (TRUE);
2280
2281 /* Infer ABI from ISA if not specified on command line. */
2282 if (abi_xlen == 0)
2283 abi_xlen = xlen;
2284 else if (abi_xlen > xlen)
2285 as_bad ("can't have %d-bit ABI on %d-bit ISA", abi_xlen, xlen);
2286 else if (abi_xlen < xlen)
2287 as_bad ("%d-bit ABI not yet supported on %d-bit ISA", abi_xlen, xlen);
2288
2289 if (float_abi == FLOAT_ABI_DEFAULT)
2290 {
2291 riscv_subset_t *subset;
2292
2293 /* Assume soft-float unless D extension is present. */
2294 float_abi = FLOAT_ABI_SOFT;
2295
2296 for (subset = riscv_subsets.head; subset != NULL; subset = subset->next)
2297 {
2298 if (strcasecmp (subset->name, "D") == 0)
2299 float_abi = FLOAT_ABI_DOUBLE;
2300 if (strcasecmp (subset->name, "Q") == 0)
2301 float_abi = FLOAT_ABI_QUAD;
2302 }
2303 }
2304
2305 if (rve_abi)
2306 elf_flags |= EF_RISCV_RVE;
2307
2308 /* Insert float_abi into the EF_RISCV_FLOAT_ABI field of elf_flags. */
2309 elf_flags |= float_abi * (EF_RISCV_FLOAT_ABI & ~(EF_RISCV_FLOAT_ABI << 1));
2310 }
2311
2312 long
2313 md_pcrel_from (fixS *fixP)
2314 {
2315 return fixP->fx_where + fixP->fx_frag->fr_address;
2316 }
2317
2318 /* Apply a fixup to the object file. */
2319
2320 void
2321 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
2322 {
2323 unsigned int subtype;
2324 bfd_byte *buf = (bfd_byte *) (fixP->fx_frag->fr_literal + fixP->fx_where);
2325 bfd_boolean relaxable = FALSE;
2326 offsetT loc;
2327 segT sub_segment;
2328
2329 /* Remember value for tc_gen_reloc. */
2330 fixP->fx_addnumber = *valP;
2331
2332 switch (fixP->fx_r_type)
2333 {
2334 case BFD_RELOC_RISCV_HI20:
2335 case BFD_RELOC_RISCV_LO12_I:
2336 case BFD_RELOC_RISCV_LO12_S:
2337 bfd_putl32 (riscv_apply_const_reloc (fixP->fx_r_type, *valP)
2338 | bfd_getl32 (buf), buf);
2339 if (fixP->fx_addsy == NULL)
2340 fixP->fx_done = TRUE;
2341 relaxable = TRUE;
2342 break;
2343
2344 case BFD_RELOC_RISCV_GOT_HI20:
2345 case BFD_RELOC_RISCV_ADD8:
2346 case BFD_RELOC_RISCV_ADD16:
2347 case BFD_RELOC_RISCV_ADD32:
2348 case BFD_RELOC_RISCV_ADD64:
2349 case BFD_RELOC_RISCV_SUB6:
2350 case BFD_RELOC_RISCV_SUB8:
2351 case BFD_RELOC_RISCV_SUB16:
2352 case BFD_RELOC_RISCV_SUB32:
2353 case BFD_RELOC_RISCV_SUB64:
2354 case BFD_RELOC_RISCV_RELAX:
2355 break;
2356
2357 case BFD_RELOC_RISCV_TPREL_HI20:
2358 case BFD_RELOC_RISCV_TPREL_LO12_I:
2359 case BFD_RELOC_RISCV_TPREL_LO12_S:
2360 case BFD_RELOC_RISCV_TPREL_ADD:
2361 relaxable = TRUE;
2362 /* Fall through. */
2363
2364 case BFD_RELOC_RISCV_TLS_GOT_HI20:
2365 case BFD_RELOC_RISCV_TLS_GD_HI20:
2366 case BFD_RELOC_RISCV_TLS_DTPREL32:
2367 case BFD_RELOC_RISCV_TLS_DTPREL64:
2368 if (fixP->fx_addsy != NULL)
2369 S_SET_THREAD_LOCAL (fixP->fx_addsy);
2370 else
2371 as_bad_where (fixP->fx_file, fixP->fx_line,
2372 _("TLS relocation against a constant"));
2373 break;
2374
2375 case BFD_RELOC_32:
2376 /* Use pc-relative relocation for FDE initial location.
2377 The symbol address in .eh_frame may be adjusted in
2378 _bfd_elf_discard_section_eh_frame, and the content of
2379 .eh_frame will be adjusted in _bfd_elf_write_section_eh_frame.
2380 Therefore, we cannot insert a relocation whose addend symbol is
2381 in .eh_frame. Othrewise, the value may be adjusted twice.*/
2382 if (fixP->fx_addsy && fixP->fx_subsy
2383 && (sub_segment = S_GET_SEGMENT (fixP->fx_subsy))
2384 && strcmp (sub_segment->name, ".eh_frame") == 0
2385 && S_GET_VALUE (fixP->fx_subsy)
2386 == fixP->fx_frag->fr_address + fixP->fx_where)
2387 {
2388 fixP->fx_r_type = BFD_RELOC_RISCV_32_PCREL;
2389 fixP->fx_subsy = NULL;
2390 break;
2391 }
2392 /* Fall through. */
2393 case BFD_RELOC_64:
2394 case BFD_RELOC_16:
2395 case BFD_RELOC_8:
2396 case BFD_RELOC_RISCV_CFA:
2397 if (fixP->fx_addsy && fixP->fx_subsy)
2398 {
2399 fixP->fx_next = xmemdup (fixP, sizeof (*fixP), sizeof (*fixP));
2400 fixP->fx_next->fx_addsy = fixP->fx_subsy;
2401 fixP->fx_next->fx_subsy = NULL;
2402 fixP->fx_next->fx_offset = 0;
2403 fixP->fx_subsy = NULL;
2404
2405 switch (fixP->fx_r_type)
2406 {
2407 case BFD_RELOC_64:
2408 fixP->fx_r_type = BFD_RELOC_RISCV_ADD64;
2409 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_SUB64;
2410 break;
2411
2412 case BFD_RELOC_32:
2413 fixP->fx_r_type = BFD_RELOC_RISCV_ADD32;
2414 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_SUB32;
2415 break;
2416
2417 case BFD_RELOC_16:
2418 fixP->fx_r_type = BFD_RELOC_RISCV_ADD16;
2419 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_SUB16;
2420 break;
2421
2422 case BFD_RELOC_8:
2423 fixP->fx_r_type = BFD_RELOC_RISCV_ADD8;
2424 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_SUB8;
2425 break;
2426
2427 case BFD_RELOC_RISCV_CFA:
2428 /* Load the byte to get the subtype. */
2429 subtype = bfd_get_8 (NULL, &((fragS *) (fixP->fx_frag->fr_opcode))->fr_literal[fixP->fx_where]);
2430 loc = fixP->fx_frag->fr_fix - (subtype & 7);
2431 switch (subtype)
2432 {
2433 case DW_CFA_advance_loc1:
2434 fixP->fx_where = loc + 1;
2435 fixP->fx_next->fx_where = loc + 1;
2436 fixP->fx_r_type = BFD_RELOC_RISCV_SET8;
2437 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_SUB8;
2438 break;
2439
2440 case DW_CFA_advance_loc2:
2441 fixP->fx_size = 2;
2442 fixP->fx_next->fx_size = 2;
2443 fixP->fx_where = loc + 1;
2444 fixP->fx_next->fx_where = loc + 1;
2445 fixP->fx_r_type = BFD_RELOC_RISCV_SET16;
2446 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_SUB16;
2447 break;
2448
2449 case DW_CFA_advance_loc4:
2450 fixP->fx_size = 4;
2451 fixP->fx_next->fx_size = 4;
2452 fixP->fx_where = loc;
2453 fixP->fx_next->fx_where = loc;
2454 fixP->fx_r_type = BFD_RELOC_RISCV_SET32;
2455 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_SUB32;
2456 break;
2457
2458 default:
2459 if (subtype < 0x80 && (subtype & 0x40))
2460 {
2461 /* DW_CFA_advance_loc */
2462 fixP->fx_frag = (fragS *) fixP->fx_frag->fr_opcode;
2463 fixP->fx_next->fx_frag = fixP->fx_frag;
2464 fixP->fx_r_type = BFD_RELOC_RISCV_SET6;
2465 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_SUB6;
2466 }
2467 else
2468 as_fatal (_("internal error: bad CFA value #%d"), subtype);
2469 break;
2470 }
2471 break;
2472
2473 default:
2474 /* This case is unreachable. */
2475 abort ();
2476 }
2477 }
2478 /* Fall through. */
2479
2480 case BFD_RELOC_RVA:
2481 /* If we are deleting this reloc entry, we must fill in the
2482 value now. This can happen if we have a .word which is not
2483 resolved when it appears but is later defined. */
2484 if (fixP->fx_addsy == NULL)
2485 {
2486 gas_assert (fixP->fx_size <= sizeof (valueT));
2487 md_number_to_chars ((char *) buf, *valP, fixP->fx_size);
2488 fixP->fx_done = 1;
2489 }
2490 break;
2491
2492 case BFD_RELOC_RISCV_JMP:
2493 if (fixP->fx_addsy)
2494 {
2495 /* Fill in a tentative value to improve objdump readability. */
2496 bfd_vma target = S_GET_VALUE (fixP->fx_addsy) + *valP;
2497 bfd_vma delta = target - md_pcrel_from (fixP);
2498 bfd_putl32 (bfd_getl32 (buf) | ENCODE_UJTYPE_IMM (delta), buf);
2499 }
2500 break;
2501
2502 case BFD_RELOC_12_PCREL:
2503 if (fixP->fx_addsy)
2504 {
2505 /* Fill in a tentative value to improve objdump readability. */
2506 bfd_vma target = S_GET_VALUE (fixP->fx_addsy) + *valP;
2507 bfd_vma delta = target - md_pcrel_from (fixP);
2508 bfd_putl32 (bfd_getl32 (buf) | ENCODE_SBTYPE_IMM (delta), buf);
2509 }
2510 break;
2511
2512 case BFD_RELOC_RISCV_RVC_BRANCH:
2513 if (fixP->fx_addsy)
2514 {
2515 /* Fill in a tentative value to improve objdump readability. */
2516 bfd_vma target = S_GET_VALUE (fixP->fx_addsy) + *valP;
2517 bfd_vma delta = target - md_pcrel_from (fixP);
2518 bfd_putl16 (bfd_getl16 (buf) | ENCODE_RVC_B_IMM (delta), buf);
2519 }
2520 break;
2521
2522 case BFD_RELOC_RISCV_RVC_JUMP:
2523 if (fixP->fx_addsy)
2524 {
2525 /* Fill in a tentative value to improve objdump readability. */
2526 bfd_vma target = S_GET_VALUE (fixP->fx_addsy) + *valP;
2527 bfd_vma delta = target - md_pcrel_from (fixP);
2528 bfd_putl16 (bfd_getl16 (buf) | ENCODE_RVC_J_IMM (delta), buf);
2529 }
2530 break;
2531
2532 case BFD_RELOC_RISCV_CALL:
2533 case BFD_RELOC_RISCV_CALL_PLT:
2534 relaxable = TRUE;
2535 break;
2536
2537 case BFD_RELOC_RISCV_PCREL_HI20:
2538 case BFD_RELOC_RISCV_PCREL_LO12_S:
2539 case BFD_RELOC_RISCV_PCREL_LO12_I:
2540 relaxable = riscv_opts.relax;
2541 break;
2542
2543 case BFD_RELOC_RISCV_ALIGN:
2544 break;
2545
2546 default:
2547 /* We ignore generic BFD relocations we don't know about. */
2548 if (bfd_reloc_type_lookup (stdoutput, fixP->fx_r_type) != NULL)
2549 as_fatal (_("internal error: bad relocation #%d"), fixP->fx_r_type);
2550 }
2551
2552 if (fixP->fx_subsy != NULL)
2553 as_bad_where (fixP->fx_file, fixP->fx_line,
2554 _("unsupported symbol subtraction"));
2555
2556 /* Add an R_RISCV_RELAX reloc if the reloc is relaxable. */
2557 if (relaxable && fixP->fx_tcbit && fixP->fx_addsy != NULL)
2558 {
2559 fixP->fx_next = xmemdup (fixP, sizeof (*fixP), sizeof (*fixP));
2560 fixP->fx_next->fx_addsy = fixP->fx_next->fx_subsy = NULL;
2561 fixP->fx_next->fx_r_type = BFD_RELOC_RISCV_RELAX;
2562 }
2563 }
2564
2565 /* Because the value of .cfi_remember_state may changed after relaxation,
2566 we insert a fix to relocate it again in link-time. */
2567
2568 void
2569 riscv_pre_output_hook (void)
2570 {
2571 const frchainS *frch;
2572 const asection *s;
2573
2574 for (s = stdoutput->sections; s; s = s->next)
2575 for (frch = seg_info (s)->frchainP; frch; frch = frch->frch_next)
2576 {
2577 fragS *frag;
2578
2579 for (frag = frch->frch_root; frag; frag = frag->fr_next)
2580 {
2581 if (frag->fr_type == rs_cfa)
2582 {
2583 expressionS exp;
2584 expressionS *symval;
2585
2586 symval = symbol_get_value_expression (frag->fr_symbol);
2587 exp.X_op = O_subtract;
2588 exp.X_add_symbol = symval->X_add_symbol;
2589 exp.X_add_number = 0;
2590 exp.X_op_symbol = symval->X_op_symbol;
2591
2592 fix_new_exp (frag, (int) frag->fr_offset, 1, &exp, 0,
2593 BFD_RELOC_RISCV_CFA);
2594 }
2595 }
2596 }
2597 }
2598
2599
2600 /* This structure is used to hold a stack of .option values. */
2601
2602 struct riscv_option_stack
2603 {
2604 struct riscv_option_stack *next;
2605 struct riscv_set_options options;
2606 };
2607
2608 static struct riscv_option_stack *riscv_opts_stack;
2609
2610 /* Handle the .option pseudo-op. */
2611
2612 static void
2613 s_riscv_option (int x ATTRIBUTE_UNUSED)
2614 {
2615 char *name = input_line_pointer, ch;
2616
2617 while (!is_end_of_line[(unsigned char) *input_line_pointer])
2618 ++input_line_pointer;
2619 ch = *input_line_pointer;
2620 *input_line_pointer = '\0';
2621
2622 if (strcmp (name, "rvc") == 0)
2623 riscv_set_rvc (TRUE);
2624 else if (strcmp (name, "norvc") == 0)
2625 riscv_set_rvc (FALSE);
2626 else if (strcmp (name, "pic") == 0)
2627 riscv_opts.pic = TRUE;
2628 else if (strcmp (name, "nopic") == 0)
2629 riscv_opts.pic = FALSE;
2630 else if (strcmp (name, "relax") == 0)
2631 riscv_opts.relax = TRUE;
2632 else if (strcmp (name, "norelax") == 0)
2633 riscv_opts.relax = FALSE;
2634 else if (strcmp (name, "push") == 0)
2635 {
2636 struct riscv_option_stack *s;
2637
2638 s = (struct riscv_option_stack *) xmalloc (sizeof *s);
2639 s->next = riscv_opts_stack;
2640 s->options = riscv_opts;
2641 riscv_opts_stack = s;
2642 }
2643 else if (strcmp (name, "pop") == 0)
2644 {
2645 struct riscv_option_stack *s;
2646
2647 s = riscv_opts_stack;
2648 if (s == NULL)
2649 as_bad (_(".option pop with no .option push"));
2650 else
2651 {
2652 riscv_opts = s->options;
2653 riscv_opts_stack = s->next;
2654 free (s);
2655 }
2656 }
2657 else
2658 {
2659 as_warn (_("Unrecognized .option directive: %s\n"), name);
2660 }
2661 *input_line_pointer = ch;
2662 demand_empty_rest_of_line ();
2663 }
2664
2665 /* Handle the .dtprelword and .dtpreldword pseudo-ops. They generate
2666 a 32-bit or 64-bit DTP-relative relocation (BYTES says which) for
2667 use in DWARF debug information. */
2668
2669 static void
2670 s_dtprel (int bytes)
2671 {
2672 expressionS ex;
2673 char *p;
2674
2675 expression (&ex);
2676
2677 if (ex.X_op != O_symbol)
2678 {
2679 as_bad (_("Unsupported use of %s"), (bytes == 8
2680 ? ".dtpreldword"
2681 : ".dtprelword"));
2682 ignore_rest_of_line ();
2683 }
2684
2685 p = frag_more (bytes);
2686 md_number_to_chars (p, 0, bytes);
2687 fix_new_exp (frag_now, p - frag_now->fr_literal, bytes, &ex, FALSE,
2688 (bytes == 8
2689 ? BFD_RELOC_RISCV_TLS_DTPREL64
2690 : BFD_RELOC_RISCV_TLS_DTPREL32));
2691
2692 demand_empty_rest_of_line ();
2693 }
2694
2695 /* Handle the .bss pseudo-op. */
2696
2697 static void
2698 s_bss (int ignore ATTRIBUTE_UNUSED)
2699 {
2700 subseg_set (bss_section, 0);
2701 demand_empty_rest_of_line ();
2702 }
2703
2704 static void
2705 riscv_make_nops (char *buf, bfd_vma bytes)
2706 {
2707 bfd_vma i = 0;
2708
2709 /* RISC-V instructions cannot begin or end on odd addresses, so this case
2710 means we are not within a valid instruction sequence. It is thus safe
2711 to use a zero byte, even though that is not a valid instruction. */
2712 if (bytes % 2 == 1)
2713 buf[i++] = 0;
2714
2715 /* Use at most one 2-byte NOP. */
2716 if ((bytes - i) % 4 == 2)
2717 {
2718 md_number_to_chars (buf + i, RVC_NOP, 2);
2719 i += 2;
2720 }
2721
2722 /* Fill the remainder with 4-byte NOPs. */
2723 for ( ; i < bytes; i += 4)
2724 md_number_to_chars (buf + i, RISCV_NOP, 4);
2725 }
2726
2727 /* Called from md_do_align. Used to create an alignment frag in a
2728 code section by emitting a worst-case NOP sequence that the linker
2729 will later relax to the correct number of NOPs. We can't compute
2730 the correct alignment now because of other linker relaxations. */
2731
2732 bfd_boolean
2733 riscv_frag_align_code (int n)
2734 {
2735 bfd_vma bytes = (bfd_vma) 1 << n;
2736 bfd_vma insn_alignment = riscv_opts.rvc ? 2 : 4;
2737 bfd_vma worst_case_bytes = bytes - insn_alignment;
2738 char *nops;
2739 expressionS ex;
2740
2741 /* If we are moving to a smaller alignment than the instruction size, then no
2742 alignment is required. */
2743 if (bytes <= insn_alignment)
2744 return TRUE;
2745
2746 /* When not relaxing, riscv_handle_align handles code alignment. */
2747 if (!riscv_opts.relax)
2748 return FALSE;
2749
2750 nops = frag_more (worst_case_bytes);
2751
2752 ex.X_op = O_constant;
2753 ex.X_add_number = worst_case_bytes;
2754
2755 riscv_make_nops (nops, worst_case_bytes);
2756
2757 fix_new_exp (frag_now, nops - frag_now->fr_literal, 0,
2758 &ex, FALSE, BFD_RELOC_RISCV_ALIGN);
2759
2760 return TRUE;
2761 }
2762
2763 /* Implement HANDLE_ALIGN. */
2764
2765 void
2766 riscv_handle_align (fragS *fragP)
2767 {
2768 switch (fragP->fr_type)
2769 {
2770 case rs_align_code:
2771 /* When relaxing, riscv_frag_align_code handles code alignment. */
2772 if (!riscv_opts.relax)
2773 {
2774 bfd_signed_vma bytes = (fragP->fr_next->fr_address
2775 - fragP->fr_address - fragP->fr_fix);
2776 /* We have 4 byte uncompressed nops. */
2777 bfd_signed_vma size = 4;
2778 bfd_signed_vma excess = bytes % size;
2779 char *p = fragP->fr_literal + fragP->fr_fix;
2780
2781 if (bytes <= 0)
2782 break;
2783
2784 /* Insert zeros or compressed nops to get 4 byte alignment. */
2785 if (excess)
2786 {
2787 riscv_make_nops (p, excess);
2788 fragP->fr_fix += excess;
2789 p += excess;
2790 }
2791
2792 /* Insert variable number of 4 byte uncompressed nops. */
2793 riscv_make_nops (p, size);
2794 fragP->fr_var = size;
2795 }
2796 break;
2797
2798 default:
2799 break;
2800 }
2801 }
2802
2803 int
2804 md_estimate_size_before_relax (fragS *fragp, asection *segtype)
2805 {
2806 return (fragp->fr_var = relaxed_branch_length (fragp, segtype, FALSE));
2807 }
2808
2809 /* Translate internal representation of relocation info to BFD target
2810 format. */
2811
2812 arelent *
2813 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
2814 {
2815 arelent *reloc = (arelent *) xmalloc (sizeof (arelent));
2816
2817 reloc->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
2818 *reloc->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
2819 reloc->address = fixp->fx_frag->fr_address + fixp->fx_where;
2820 reloc->addend = fixp->fx_addnumber;
2821
2822 reloc->howto = bfd_reloc_type_lookup (stdoutput, fixp->fx_r_type);
2823 if (reloc->howto == NULL)
2824 {
2825 if ((fixp->fx_r_type == BFD_RELOC_16 || fixp->fx_r_type == BFD_RELOC_8)
2826 && fixp->fx_addsy != NULL && fixp->fx_subsy != NULL)
2827 {
2828 /* We don't have R_RISCV_8/16, but for this special case,
2829 we can use R_RISCV_ADD8/16 with R_RISCV_SUB8/16. */
2830 return reloc;
2831 }
2832
2833 as_bad_where (fixp->fx_file, fixp->fx_line,
2834 _("cannot represent %s relocation in object file"),
2835 bfd_get_reloc_code_name (fixp->fx_r_type));
2836 return NULL;
2837 }
2838
2839 return reloc;
2840 }
2841
2842 int
2843 riscv_relax_frag (asection *sec, fragS *fragp, long stretch ATTRIBUTE_UNUSED)
2844 {
2845 if (RELAX_BRANCH_P (fragp->fr_subtype))
2846 {
2847 offsetT old_var = fragp->fr_var;
2848 fragp->fr_var = relaxed_branch_length (fragp, sec, TRUE);
2849 return fragp->fr_var - old_var;
2850 }
2851
2852 return 0;
2853 }
2854
2855 /* Expand far branches to multi-instruction sequences. */
2856
2857 static void
2858 md_convert_frag_branch (fragS *fragp)
2859 {
2860 bfd_byte *buf;
2861 expressionS exp;
2862 fixS *fixp;
2863 insn_t insn;
2864 int rs1, reloc;
2865
2866 buf = (bfd_byte *)fragp->fr_literal + fragp->fr_fix;
2867
2868 exp.X_op = O_symbol;
2869 exp.X_add_symbol = fragp->fr_symbol;
2870 exp.X_add_number = fragp->fr_offset;
2871
2872 gas_assert (fragp->fr_var == RELAX_BRANCH_LENGTH (fragp->fr_subtype));
2873
2874 if (RELAX_BRANCH_RVC (fragp->fr_subtype))
2875 {
2876 switch (RELAX_BRANCH_LENGTH (fragp->fr_subtype))
2877 {
2878 case 8:
2879 case 4:
2880 /* Expand the RVC branch into a RISC-V one. */
2881 insn = bfd_getl16 (buf);
2882 rs1 = 8 + ((insn >> OP_SH_CRS1S) & OP_MASK_CRS1S);
2883 if ((insn & MASK_C_J) == MATCH_C_J)
2884 insn = MATCH_JAL;
2885 else if ((insn & MASK_C_JAL) == MATCH_C_JAL)
2886 insn = MATCH_JAL | (X_RA << OP_SH_RD);
2887 else if ((insn & MASK_C_BEQZ) == MATCH_C_BEQZ)
2888 insn = MATCH_BEQ | (rs1 << OP_SH_RS1);
2889 else if ((insn & MASK_C_BNEZ) == MATCH_C_BNEZ)
2890 insn = MATCH_BNE | (rs1 << OP_SH_RS1);
2891 else
2892 abort ();
2893 bfd_putl32 (insn, buf);
2894 break;
2895
2896 case 6:
2897 /* Invert the branch condition. Branch over the jump. */
2898 insn = bfd_getl16 (buf);
2899 insn ^= MATCH_C_BEQZ ^ MATCH_C_BNEZ;
2900 insn |= ENCODE_RVC_B_IMM (6);
2901 bfd_putl16 (insn, buf);
2902 buf += 2;
2903 goto jump;
2904
2905 case 2:
2906 /* Just keep the RVC branch. */
2907 reloc = RELAX_BRANCH_UNCOND (fragp->fr_subtype)
2908 ? BFD_RELOC_RISCV_RVC_JUMP : BFD_RELOC_RISCV_RVC_BRANCH;
2909 fixp = fix_new_exp (fragp, buf - (bfd_byte *)fragp->fr_literal,
2910 2, &exp, FALSE, reloc);
2911 buf += 2;
2912 goto done;
2913
2914 default:
2915 abort ();
2916 }
2917 }
2918
2919 switch (RELAX_BRANCH_LENGTH (fragp->fr_subtype))
2920 {
2921 case 8:
2922 gas_assert (!RELAX_BRANCH_UNCOND (fragp->fr_subtype));
2923
2924 /* Invert the branch condition. Branch over the jump. */
2925 insn = bfd_getl32 (buf);
2926 insn ^= MATCH_BEQ ^ MATCH_BNE;
2927 insn |= ENCODE_SBTYPE_IMM (8);
2928 md_number_to_chars ((char *) buf, insn, 4);
2929 buf += 4;
2930
2931 jump:
2932 /* Jump to the target. */
2933 fixp = fix_new_exp (fragp, buf - (bfd_byte *)fragp->fr_literal,
2934 4, &exp, FALSE, BFD_RELOC_RISCV_JMP);
2935 md_number_to_chars ((char *) buf, MATCH_JAL, 4);
2936 buf += 4;
2937 break;
2938
2939 case 4:
2940 reloc = RELAX_BRANCH_UNCOND (fragp->fr_subtype)
2941 ? BFD_RELOC_RISCV_JMP : BFD_RELOC_12_PCREL;
2942 fixp = fix_new_exp (fragp, buf - (bfd_byte *)fragp->fr_literal,
2943 4, &exp, FALSE, reloc);
2944 buf += 4;
2945 break;
2946
2947 default:
2948 abort ();
2949 }
2950
2951 done:
2952 fixp->fx_file = fragp->fr_file;
2953 fixp->fx_line = fragp->fr_line;
2954
2955 gas_assert (buf == (bfd_byte *)fragp->fr_literal
2956 + fragp->fr_fix + fragp->fr_var);
2957
2958 fragp->fr_fix += fragp->fr_var;
2959 }
2960
2961 /* Relax a machine dependent frag. This returns the amount by which
2962 the current size of the frag should change. */
2963
2964 void
2965 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT asec ATTRIBUTE_UNUSED,
2966 fragS *fragp)
2967 {
2968 gas_assert (RELAX_BRANCH_P (fragp->fr_subtype));
2969 md_convert_frag_branch (fragp);
2970 }
2971
2972 void
2973 md_show_usage (FILE *stream)
2974 {
2975 fprintf (stream, _("\
2976 RISC-V options:\n\
2977 -fpic generate position-independent code\n\
2978 -fno-pic don't generate position-independent code (default)\n\
2979 -march=ISA set the RISC-V architecture\n\
2980 -mabi=ABI set the RISC-V ABI\n\
2981 -mrelax enable relax (default)\n\
2982 -mno-relax disable relax\n\
2983 -march-attr generate RISC-V arch attribute\n\
2984 -mno-arch-attr don't generate RISC-V arch attribute\n\
2985 "));
2986 }
2987
2988 /* Standard calling conventions leave the CFA at SP on entry. */
2989 void
2990 riscv_cfi_frame_initial_instructions (void)
2991 {
2992 cfi_add_CFA_def_cfa_register (X_SP);
2993 }
2994
2995 int
2996 tc_riscv_regname_to_dw2regnum (char *regname)
2997 {
2998 int reg;
2999
3000 if ((reg = reg_lookup_internal (regname, RCLASS_GPR)) >= 0)
3001 return reg;
3002
3003 if ((reg = reg_lookup_internal (regname, RCLASS_FPR)) >= 0)
3004 return reg + 32;
3005
3006 as_bad (_("unknown register `%s'"), regname);
3007 return -1;
3008 }
3009
3010 void
3011 riscv_elf_final_processing (void)
3012 {
3013 elf_elfheader (stdoutput)->e_flags |= elf_flags;
3014 }
3015
3016 /* Parse the .sleb128 and .uleb128 pseudos. Only allow constant expressions,
3017 since these directives break relaxation when used with symbol deltas. */
3018
3019 static void
3020 s_riscv_leb128 (int sign)
3021 {
3022 expressionS exp;
3023 char *save_in = input_line_pointer;
3024
3025 expression (&exp);
3026 if (exp.X_op != O_constant)
3027 as_bad (_("non-constant .%cleb128 is not supported"), sign ? 's' : 'u');
3028 demand_empty_rest_of_line ();
3029
3030 input_line_pointer = save_in;
3031 return s_leb128 (sign);
3032 }
3033
3034 /* Parse the .insn directive. */
3035
3036 static void
3037 s_riscv_insn (int x ATTRIBUTE_UNUSED)
3038 {
3039 char *str = input_line_pointer;
3040 struct riscv_cl_insn insn;
3041 expressionS imm_expr;
3042 bfd_reloc_code_real_type imm_reloc = BFD_RELOC_UNUSED;
3043 char save_c;
3044
3045 while (!is_end_of_line[(unsigned char) *input_line_pointer])
3046 ++input_line_pointer;
3047
3048 save_c = *input_line_pointer;
3049 *input_line_pointer = '\0';
3050
3051 const char *error = riscv_ip (str, &insn, &imm_expr,
3052 &imm_reloc, insn_type_hash);
3053
3054 if (error)
3055 {
3056 as_bad ("%s `%s'", error, str);
3057 }
3058 else
3059 {
3060 gas_assert (insn.insn_mo->pinfo != INSN_MACRO);
3061 append_insn (&insn, &imm_expr, imm_reloc);
3062 }
3063
3064 *input_line_pointer = save_c;
3065 demand_empty_rest_of_line ();
3066 }
3067
3068 /* Update arch attributes. */
3069
3070 static void
3071 riscv_write_out_arch_attr (void)
3072 {
3073 const char *arch_str = riscv_arch_str (xlen, &riscv_subsets);
3074
3075 bfd_elf_add_proc_attr_string (stdoutput, Tag_RISCV_arch, arch_str);
3076
3077 xfree ((void *)arch_str);
3078 }
3079
3080 /* Add the default contents for the .riscv.attributes section. */
3081
3082 static void
3083 riscv_set_public_attributes (void)
3084 {
3085 if (riscv_opts.arch_attr || explicit_arch_attr)
3086 /* Re-write arch attribute to normalize the arch string. */
3087 riscv_write_out_arch_attr ();
3088 }
3089
3090 /* Called after all assembly has been done. */
3091
3092 void
3093 riscv_md_end (void)
3094 {
3095 riscv_set_public_attributes ();
3096 }
3097
3098 /* Given a symbolic attribute NAME, return the proper integer value.
3099 Returns -1 if the attribute is not known. */
3100
3101 int
3102 riscv_convert_symbolic_attribute (const char *name)
3103 {
3104 static const struct
3105 {
3106 const char * name;
3107 const int tag;
3108 }
3109 attribute_table[] =
3110 {
3111 /* When you modify this table you should
3112 also modify the list in doc/c-riscv.texi. */
3113 #define T(tag) {#tag, Tag_RISCV_##tag}, {"Tag_RISCV_" #tag, Tag_RISCV_##tag}
3114 T(arch),
3115 T(priv_spec),
3116 T(priv_spec_minor),
3117 T(priv_spec_revision),
3118 T(unaligned_access),
3119 T(stack_align),
3120 #undef T
3121 };
3122
3123 unsigned int i;
3124
3125 if (name == NULL)
3126 return -1;
3127
3128 for (i = 0; i < ARRAY_SIZE (attribute_table); i++)
3129 if (strcmp (name, attribute_table[i].name) == 0)
3130 return attribute_table[i].tag;
3131
3132 return -1;
3133 }
3134
3135 /* Parse a .attribute directive. */
3136
3137 static void
3138 s_riscv_attribute (int ignored ATTRIBUTE_UNUSED)
3139 {
3140 int tag = obj_elf_vendor_attribute (OBJ_ATTR_PROC);
3141
3142 if (tag == Tag_RISCV_arch)
3143 {
3144 unsigned old_xlen = xlen;
3145
3146 explicit_arch_attr = TRUE;
3147 obj_attribute *attr;
3148 attr = elf_known_obj_attributes_proc (stdoutput);
3149 if (!start_assemble)
3150 riscv_set_arch (attr[Tag_RISCV_arch].s);
3151 else
3152 as_fatal (_(".attribute arch must set before any instructions"));
3153
3154 if (old_xlen != xlen)
3155 {
3156 /* We must re-init bfd again if xlen is changed. */
3157 unsigned long mach = xlen == 64 ? bfd_mach_riscv64 : bfd_mach_riscv32;
3158 bfd_find_target (riscv_target_format (), stdoutput);
3159
3160 if (! bfd_set_arch_mach (stdoutput, bfd_arch_riscv, mach))
3161 as_warn (_("Could not set architecture and machine"));
3162 }
3163 }
3164 }
3165
3166 /* Pseudo-op table. */
3167
3168 static const pseudo_typeS riscv_pseudo_table[] =
3169 {
3170 /* RISC-V-specific pseudo-ops. */
3171 {"option", s_riscv_option, 0},
3172 {"half", cons, 2},
3173 {"word", cons, 4},
3174 {"dword", cons, 8},
3175 {"dtprelword", s_dtprel, 4},
3176 {"dtpreldword", s_dtprel, 8},
3177 {"bss", s_bss, 0},
3178 {"uleb128", s_riscv_leb128, 0},
3179 {"sleb128", s_riscv_leb128, 1},
3180 {"insn", s_riscv_insn, 0},
3181 {"attribute", s_riscv_attribute, 0},
3182
3183 { NULL, NULL, 0 },
3184 };
3185
3186 void
3187 riscv_pop_insert (void)
3188 {
3189 extern void pop_insert (const pseudo_typeS *);
3190
3191 pop_insert (riscv_pseudo_table);
3192 }