]> git.ipfire.org Git - thirdparty/glibc.git/blob - sysdeps/sparc/sparc64/dl-machine.h
Update.
[thirdparty/glibc.git] / sysdeps / sparc / sparc64 / dl-machine.h
1 /* Machine-dependent ELF dynamic relocation inline functions. Sparc64 version.
2 Copyright (C) 1997, 1998, 1999, 2000, 2001 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4
5 The GNU C Library is free software; you can redistribute it and/or
6 modify it under the terms of the GNU Lesser General Public
7 License as published by the Free Software Foundation; either
8 version 2.1 of the License, or (at your option) any later version.
9
10 The GNU C Library is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 Lesser General Public License for more details.
14
15 You should have received a copy of the GNU Lesser General Public
16 License along with the GNU C Library; if not, write to the Free
17 Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
18 02111-1307 USA. */
19
20 #define ELF_MACHINE_NAME "sparc64"
21
22 #include <string.h>
23 #include <sys/param.h>
24 #include <ldsodefs.h>
25 #include <sysdep.h>
26
27 #define ELF64_R_TYPE_ID(info) ((info) & 0xff)
28 #define ELF64_R_TYPE_DATA(info) ((info) >> 8)
29
30 /* Return nonzero iff ELF header is compatible with the running host. */
31 static inline int
32 elf_machine_matches_host (const Elf64_Ehdr *ehdr)
33 {
34 return ehdr->e_machine == EM_SPARCV9;
35 }
36
37 /* Return the link-time address of _DYNAMIC. Conveniently, this is the
38 first element of the GOT. This must be inlined in a function which
39 uses global data. */
40 static inline Elf64_Addr
41 elf_machine_dynamic (void)
42 {
43 register Elf64_Addr *elf_pic_register __asm__("%l7");
44
45 return *elf_pic_register;
46 }
47
48 /* Return the run-time load address of the shared object. */
49 static inline Elf64_Addr
50 elf_machine_load_address (void)
51 {
52 register Elf64_Addr *elf_pic_register __asm__("%l7");
53
54 /* We used to utilize the fact that a local .got entry will
55 be partially initialized at startup awaiting its RELATIVE
56 fixup:
57
58 Elf64_Addr pc, la;
59
60 __asm("sethi %%hi(.Load_address), %1\n"
61 ".Load_address:\n\t"
62 "rd %%pc, %0\n\t"
63 "or %1, %%lo(.Load_address), %1\n\t"
64 : "=r"(pc), "=r"(la));
65
66 return pc - *(Elf64_Addr *)(elf_pic_register + la);
67
68 Unfortunately as binutils tries to work around Solaris
69 dynamic linker bug which resolves R_SPARC_RELATIVE as X += B + A
70 instead of X = B + A this does not work any longer, since ld
71 clears it.
72
73 The following method relies on the fact that sparcv9 ABI maximal
74 page length is 1MB and all ELF segments on sparc64 are aligned
75 to 1MB. Also, it relies on _DYNAMIC coming after _GLOBAL_OFFSET_TABLE_
76 and assumes that they both fit into the first 1MB of the RW segment.
77 This should be true for some time unless ld.so grows too much, at the
78 moment the whole stripped ld.so is 128KB and only smaller part of that
79 is in the RW segment. */
80
81 return ((Elf64_Addr)elf_pic_register - *elf_pic_register + 0xfffff)
82 & ~0xfffffUL;
83 }
84
85 /* We have 4 cases to handle. And we code different code sequences
86 for each one. I love V9 code models... */
87 static inline Elf64_Addr
88 elf_machine_fixup_plt (struct link_map *map, lookup_t t,
89 const Elf64_Rela *reloc,
90 Elf64_Addr *reloc_addr, Elf64_Addr value)
91 {
92 unsigned int *insns = (unsigned int *) reloc_addr;
93 Elf64_Addr plt_vaddr = (Elf64_Addr) reloc_addr;
94
95 /* Now move plt_vaddr up to the call instruction. */
96 plt_vaddr += (2 * 4);
97
98 /* PLT entries .PLT32768 and above look always the same. */
99 if (__builtin_expect (reloc->r_addend, 0) != 0)
100 {
101 *reloc_addr = value - map->l_addr;
102 }
103 /* 32-bit Sparc style, the target is in the lower 32-bits of
104 address space. */
105 else if ((value >> 32) == 0)
106 {
107 /* sethi %hi(target), %g1
108 jmpl %g1 + %lo(target), %g0 */
109
110 insns[2] = 0x81c06000 | (value & 0x3ff);
111 __asm __volatile ("flush %0 + 8" : : "r" (insns));
112
113 insns[1] = 0x03000000 | ((unsigned int)(value >> 10));
114 __asm __volatile ("flush %0 + 4" : : "r" (insns));
115 }
116 /* We can also get somewhat simple sequences if the distance between
117 the target and the PLT entry is within +/- 2GB. */
118 else if ((plt_vaddr > value
119 && ((plt_vaddr - value) >> 32) == 0)
120 || (value > plt_vaddr
121 && ((value - plt_vaddr) >> 32) == 0))
122 {
123 unsigned int displacement;
124
125 if (plt_vaddr > value)
126 displacement = (0 - (plt_vaddr - value));
127 else
128 displacement = value - plt_vaddr;
129
130 /* mov %o7, %g1
131 call displacement
132 mov %g1, %o7 */
133
134 insns[3] = 0x9e100001;
135 __asm __volatile ("flush %0 + 12" : : "r" (insns));
136
137 insns[2] = 0x40000000 | (displacement >> 2);
138 __asm __volatile ("flush %0 + 8" : : "r" (insns));
139
140 insns[1] = 0x8210000f;
141 __asm __volatile ("flush %0 + 4" : : "r" (insns));
142 }
143 /* Worst case, ho hum... */
144 else
145 {
146 unsigned int high32 = (value >> 32);
147 unsigned int low32 = (unsigned int) value;
148
149 /* ??? Some tricks can be stolen from the sparc64 egcs backend
150 constant formation code I wrote. -DaveM */
151
152 /* sethi %hh(value), %g1
153 sethi %lm(value), %g5
154 or %g1, %hm(value), %g1
155 or %g5, %lo(value), %g5
156 sllx %g1, 32, %g1
157 jmpl %g1 + %g5, %g0
158 nop */
159
160 insns[6] = 0x81c04005;
161 __asm __volatile ("flush %0 + 24" : : "r" (insns));
162
163 insns[5] = 0x83287020;
164 __asm __volatile ("flush %0 + 20" : : "r" (insns));
165
166 insns[4] = 0x8a116000 | (low32 & 0x3ff);
167 __asm __volatile ("flush %0 + 16" : : "r" (insns));
168
169 insns[3] = 0x82106000 | (high32 & 0x3ff);
170 __asm __volatile ("flush %0 + 12" : : "r" (insns));
171
172 insns[2] = 0x0b000000 | (low32 >> 10);
173 __asm __volatile ("flush %0 + 8" : : "r" (insns));
174
175 insns[1] = 0x03000000 | (high32 >> 10);
176 __asm __volatile ("flush %0 + 4" : : "r" (insns));
177 }
178
179 return value;
180 }
181
182 /* Return the final value of a plt relocation. */
183 static inline Elf64_Addr
184 elf_machine_plt_value (struct link_map *map, const Elf64_Rela *reloc,
185 Elf64_Addr value)
186 {
187 return value + reloc->r_addend;
188 }
189
190 #ifdef RESOLVE
191
192 /* Perform the relocation specified by RELOC and SYM (which is fully resolved).
193 MAP is the object containing the reloc. */
194
195 static inline void
196 elf_machine_rela (struct link_map *map, const Elf64_Rela *reloc,
197 const Elf64_Sym *sym, const struct r_found_version *version,
198 Elf64_Addr *const reloc_addr)
199 {
200 const unsigned long int r_type = ELF64_R_TYPE_ID (reloc->r_info);
201
202 if (__builtin_expect (r_type == R_SPARC_RELATIVE, 0))
203 *reloc_addr = map->l_addr + reloc->r_addend;
204 #ifndef RTLD_BOOTSTRAP
205 else if (r_type == R_SPARC_NONE) /* Who is Wilbur? */
206 return;
207 #endif
208 else
209 {
210 #ifndef RTLD_BOOTSTRAP
211 const Elf64_Sym *const refsym = sym;
212 #endif
213 Elf64_Addr value;
214 if (sym->st_shndx != SHN_UNDEF &&
215 ELF64_ST_BIND (sym->st_info) == STB_LOCAL)
216 value = map->l_addr;
217 else
218 {
219 value = RESOLVE (&sym, version, r_type);
220 if (sym)
221 value += sym->st_value;
222 }
223 value += reloc->r_addend; /* Assume copy relocs have zero addend. */
224
225 switch (r_type)
226 {
227 #ifndef RTLD_BOOTSTRAP
228 case R_SPARC_COPY:
229 if (sym == NULL)
230 /* This can happen in trace mode if an object could not be
231 found. */
232 break;
233 if (sym->st_size > refsym->st_size
234 || (_dl_verbose && sym->st_size < refsym->st_size))
235 {
236 extern char **_dl_argv;
237 const char *strtab;
238
239 strtab = (const void *) D_PTR (map, l_info[DT_STRTAB]);
240 _dl_error_printf ("\
241 %s: Symbol `%s' has different size in shared object, consider re-linking\n",
242 _dl_argv[0] ?: "<program name unknown>",
243 strtab + refsym->st_name);
244 }
245 memcpy (reloc_addr, (void *) value, MIN (sym->st_size,
246 refsym->st_size));
247 break;
248 #endif
249 case R_SPARC_64:
250 case R_SPARC_GLOB_DAT:
251 *reloc_addr = value;
252 break;
253 #ifndef RTLD_BOOTSTRAP
254 case R_SPARC_8:
255 *(char *) reloc_addr = value;
256 break;
257 case R_SPARC_16:
258 *(short *) reloc_addr = value;
259 break;
260 case R_SPARC_32:
261 *(unsigned int *) reloc_addr = value;
262 break;
263 case R_SPARC_DISP8:
264 *(char *) reloc_addr = (value - (Elf64_Addr) reloc_addr);
265 break;
266 case R_SPARC_DISP16:
267 *(short *) reloc_addr = (value - (Elf64_Addr) reloc_addr);
268 break;
269 case R_SPARC_DISP32:
270 *(unsigned int *) reloc_addr = (value - (Elf64_Addr) reloc_addr);
271 break;
272 case R_SPARC_WDISP30:
273 *(unsigned int *) reloc_addr =
274 ((*(unsigned int *)reloc_addr & 0xc0000000) |
275 ((value - (Elf64_Addr) reloc_addr) >> 2));
276 break;
277
278 /* MEDLOW code model relocs */
279 case R_SPARC_LO10:
280 *(unsigned int *) reloc_addr =
281 ((*(unsigned int *)reloc_addr & ~0x3ff) |
282 (value & 0x3ff));
283 break;
284 case R_SPARC_HI22:
285 *(unsigned int *) reloc_addr =
286 ((*(unsigned int *)reloc_addr & 0xffc00000) |
287 (value >> 10));
288 break;
289 case R_SPARC_OLO10:
290 *(unsigned int *) reloc_addr =
291 ((*(unsigned int *)reloc_addr & ~0x1fff) |
292 (((value & 0x3ff) + ELF64_R_TYPE_DATA (reloc->r_info)) & 0x1fff));
293 break;
294
295 /* MEDMID code model relocs */
296 case R_SPARC_H44:
297 *(unsigned int *) reloc_addr =
298 ((*(unsigned int *)reloc_addr & 0xffc00000) |
299 (value >> 22));
300 break;
301 case R_SPARC_M44:
302 *(unsigned int *) reloc_addr =
303 ((*(unsigned int *)reloc_addr & ~0x3ff) |
304 ((value >> 12) & 0x3ff));
305 break;
306 case R_SPARC_L44:
307 *(unsigned int *) reloc_addr =
308 ((*(unsigned int *)reloc_addr & ~0xfff) |
309 (value & 0xfff));
310 break;
311
312 /* MEDANY code model relocs */
313 case R_SPARC_HH22:
314 *(unsigned int *) reloc_addr =
315 ((*(unsigned int *)reloc_addr & 0xffc00000) |
316 (value >> 42));
317 break;
318 case R_SPARC_HM10:
319 *(unsigned int *) reloc_addr =
320 ((*(unsigned int *)reloc_addr & ~0x3ff) |
321 ((value >> 32) & 0x3ff));
322 break;
323 case R_SPARC_LM22:
324 *(unsigned int *) reloc_addr =
325 ((*(unsigned int *)reloc_addr & 0xffc00000) |
326 ((value >> 10) & 0x003fffff));
327 break;
328 #endif
329 case R_SPARC_JMP_SLOT:
330 elf_machine_fixup_plt(map, 0, reloc, reloc_addr, value);
331 break;
332 #ifndef RTLD_BOOTSTRAP
333 case R_SPARC_UA16:
334 ((unsigned char *) reloc_addr) [0] = value >> 8;
335 ((unsigned char *) reloc_addr) [1] = value;
336 break;
337 case R_SPARC_UA32:
338 ((unsigned char *) reloc_addr) [0] = value >> 24;
339 ((unsigned char *) reloc_addr) [1] = value >> 16;
340 ((unsigned char *) reloc_addr) [2] = value >> 8;
341 ((unsigned char *) reloc_addr) [3] = value;
342 break;
343 case R_SPARC_UA64:
344 if (! ((long) reloc_addr & 3))
345 {
346 /* Common in .eh_frame */
347 ((unsigned int *) reloc_addr) [0] = value >> 32;
348 ((unsigned int *) reloc_addr) [1] = value;
349 break;
350 }
351 ((unsigned char *) reloc_addr) [0] = value >> 56;
352 ((unsigned char *) reloc_addr) [1] = value >> 48;
353 ((unsigned char *) reloc_addr) [2] = value >> 40;
354 ((unsigned char *) reloc_addr) [3] = value >> 32;
355 ((unsigned char *) reloc_addr) [4] = value >> 24;
356 ((unsigned char *) reloc_addr) [5] = value >> 16;
357 ((unsigned char *) reloc_addr) [6] = value >> 8;
358 ((unsigned char *) reloc_addr) [7] = value;
359 break;
360 #endif
361 #if !defined RTLD_BOOTSTRAP || defined _NDEBUG
362 default:
363 _dl_reloc_bad_type (map, r_type, 0);
364 break;
365 #endif
366 }
367 }
368 }
369
370 static inline void
371 elf_machine_rel_relative (Elf64_Addr l_addr, const Elf64_Rel *reloc,
372 Elf64_Addr *const reloc_addr)
373 {
374 *reloc_addr = l_addr + reloc->r_addend;
375 }
376
377 static inline void
378 elf_machine_lazy_rel (struct link_map *map,
379 Elf64_Addr l_addr, const Elf64_Rela *reloc)
380 {
381 switch (ELF64_R_TYPE (reloc->r_info))
382 {
383 case R_SPARC_NONE:
384 break;
385 case R_SPARC_JMP_SLOT:
386 break;
387 default:
388 _dl_reloc_bad_type (map, ELFW(R_TYPE) (reloc->r_info), 1);
389 break;
390 }
391 }
392
393 #endif /* RESOLVE */
394
395 /* Nonzero iff TYPE should not be allowed to resolve to one of
396 the main executable's symbols, as for a COPY reloc. */
397 #define elf_machine_lookup_noexec_p(type) ((type) == R_SPARC_COPY)
398
399 /* Nonzero iff TYPE describes relocation of a PLT entry, so
400 PLT entries should not be allowed to define the value. */
401 #define elf_machine_lookup_noplt_p(type) ((type) == R_SPARC_JMP_SLOT)
402
403 /* A reloc type used for ld.so cmdline arg lookups to reject PLT entries. */
404 #define ELF_MACHINE_JMP_SLOT R_SPARC_JMP_SLOT
405
406 /* The SPARC never uses Elf64_Rel relocations. */
407 #define ELF_MACHINE_NO_REL 1
408
409 /* The SPARC overlaps DT_RELA and DT_PLTREL. */
410 #define ELF_MACHINE_PLTREL_OVERLAP 1
411
412 /* Set up the loaded object described by L so its unrelocated PLT
413 entries will jump to the on-demand fixup code in dl-runtime.c. */
414
415 static inline int
416 elf_machine_runtime_setup (struct link_map *l, int lazy, int profile)
417 {
418 if (l->l_info[DT_JMPREL] && lazy)
419 {
420 extern void _dl_runtime_resolve_0 (void);
421 extern void _dl_runtime_resolve_1 (void);
422 extern void _dl_runtime_profile_0 (void);
423 extern void _dl_runtime_profile_1 (void);
424 Elf64_Addr res0_addr, res1_addr;
425 unsigned int *plt = (void *) D_PTR (l, l_info[DT_PLTGOT]);
426
427 if (! profile)
428 {
429 res0_addr = (Elf64_Addr) &_dl_runtime_resolve_0;
430 res1_addr = (Elf64_Addr) &_dl_runtime_resolve_1;
431 }
432 else
433 {
434 res0_addr = (Elf64_Addr) &_dl_runtime_profile_0;
435 res1_addr = (Elf64_Addr) &_dl_runtime_profile_1;
436 if (_dl_name_match_p (_dl_profile, l))
437 _dl_profile_map = l;
438 }
439
440 /* PLT0 looks like:
441
442 save %sp, -192, %sp
443 sethi %hh(_dl_runtime_{resolve,profile}_0), %l0
444 sethi %lm(_dl_runtime_{resolve,profile}_0), %l1
445 or %l0, %hm(_dl_runtime_{resolve,profile}_0), %l0
446 or %l1, %lo(_dl_runtime_{resolve,profile}_0), %l1
447 sllx %l0, 32, %l0
448 jmpl %l0 + %l1, %l6
449 sethi %hi(0xffc00), %l2
450 */
451
452 plt[0] = 0x9de3bf40;
453 plt[1] = 0x21000000 | (res0_addr >> (64 - 22));
454 plt[2] = 0x23000000 | ((res0_addr >> 10) & 0x003fffff);
455 plt[3] = 0xa0142000 | ((res0_addr >> 32) & 0x3ff);
456 plt[4] = 0xa2146000 | (res0_addr & 0x3ff);
457 plt[5] = 0xa12c3020;
458 plt[6] = 0xadc40011;
459 plt[7] = 0x250003ff;
460
461 /* PLT1 looks like:
462
463 save %sp, -192, %sp
464 sethi %hh(_dl_runtime_{resolve,profile}_1), %l0
465 sethi %lm(_dl_runtime_{resolve,profile}_1), %l1
466 or %l0, %hm(_dl_runtime_{resolve,profile}_1), %l0
467 or %l1, %lo(_dl_runtime_{resolve,profile}_1), %l1
468 sllx %l0, 32, %l0
469 jmpl %l0 + %l1, %l6
470 srlx %g1, 12, %o1
471 */
472
473 plt[8 + 0] = 0x9de3bf40;
474 plt[8 + 1] = 0x21000000 | (res1_addr >> (64 - 22));
475 plt[8 + 2] = 0x23000000 | ((res1_addr >> 10) & 0x003fffff);
476 plt[8 + 3] = 0xa0142000 | ((res1_addr >> 32) & 0x3ff);
477 plt[8 + 4] = 0xa2146000 | (res1_addr & 0x3ff);
478 plt[8 + 5] = 0xa12c3020;
479 plt[8 + 6] = 0xadc40011;
480 plt[8 + 7] = 0x9330700c;
481
482 /* Now put the magic cookie at the beginning of .PLT2
483 Entry .PLT3 is unused by this implementation. */
484 *((struct link_map **)(&plt[16 + 0])) = l;
485 }
486
487 return lazy;
488 }
489
490 /* This code is used in dl-runtime.c to call the `fixup' function
491 and then redirect to the address it returns. */
492 #define TRAMPOLINE_TEMPLATE(tramp_name, fixup_name) \
493 asm ("\n" \
494 " .text\n" \
495 " .globl " #tramp_name "_0\n" \
496 " .type " #tramp_name "_0, @function\n" \
497 " .align 32\n" \
498 "\t" #tramp_name "_0:\n" \
499 " ! sethi %hi(1047552), %l2 - Done in .PLT0\n" \
500 " ldx [%l6 + 32 + 8], %o0\n" \
501 " sub %g1, %l6, %l0\n" \
502 " xor %l2, -1016, %l2\n" \
503 " sethi %hi(5120), %l3 ! 160 * 32\n" \
504 " add %l0, %l2, %l0\n" \
505 " sethi %hi(32768), %l4\n" \
506 " udivx %l0, %l3, %l3\n" \
507 " sllx %l3, 2, %l1\n" \
508 " add %l1, %l3, %l1\n" \
509 " sllx %l1, 10, %l2\n" \
510 " sub %l4, 4, %l4 ! No thanks to Sun for not obeying their own ABI\n" \
511 " sllx %l1, 5, %l1\n" \
512 " sub %l0, %l2, %l0\n" \
513 " udivx %l0, 24, %l0\n" \
514 " add %l0, %l4, %l0\n" \
515 " add %l1, %l0, %l1\n" \
516 " add %l1, %l1, %l0\n" \
517 " add %l0, %l1, %l0\n" \
518 " mov %i7, %o2\n" \
519 " call " #fixup_name "\n" \
520 " sllx %l0, 3, %o1\n" \
521 " jmp %o0\n" \
522 " restore\n" \
523 " .size " #tramp_name "_0, . - " #tramp_name "_0\n" \
524 "\n" \
525 " .globl " #tramp_name "_1\n" \
526 " .type " #tramp_name "_1, @function\n" \
527 " .align 32\n" \
528 "\t" #tramp_name "_1:\n" \
529 " ! srlx %g1, 12, %o1 - Done in .PLT1\n" \
530 " ldx [%l6 + 8], %o0\n" \
531 " add %o1, %o1, %o3\n" \
532 " sub %o1, 96, %o1 ! No thanks to Sun for not obeying their own ABI\n" \
533 " mov %i7, %o2\n" \
534 " call " #fixup_name "\n" \
535 " add %o1, %o3, %o1\n" \
536 " jmp %o0\n" \
537 " restore\n" \
538 " .size " #tramp_name "_1, . - " #tramp_name "_1\n" \
539 " .previous\n");
540
541 #ifndef PROF
542 #define ELF_MACHINE_RUNTIME_TRAMPOLINE \
543 TRAMPOLINE_TEMPLATE (_dl_runtime_resolve, fixup); \
544 TRAMPOLINE_TEMPLATE (_dl_runtime_profile, profile_fixup);
545 #else
546 #define ELF_MACHINE_RUNTIME_TRAMPOLINE \
547 TRAMPOLINE_TEMPLATE (_dl_runtime_resolve, fixup); \
548 TRAMPOLINE_TEMPLATE (_dl_runtime_profile, fixup);
549 #endif
550
551 /* The PLT uses Elf64_Rela relocs. */
552 #define elf_machine_relplt elf_machine_rela
553
554 /* Initial entry point code for the dynamic linker.
555 The C function `_dl_start' is the real entry point;
556 its return value is the user program's entry point. */
557
558 #define __S1(x) #x
559 #define __S(x) __S1(x)
560
561 #define RTLD_START __asm__ ( "\n" \
562 " .text\n" \
563 " .global _start\n" \
564 " .type _start, @function\n" \
565 " .align 32\n" \
566 "_start:\n" \
567 " /* Make room for functions to drop their arguments on the stack. */\n" \
568 " sub %sp, 6*8, %sp\n" \
569 " /* Pass pointer to argument block to _dl_start. */\n" \
570 " call _dl_start\n" \
571 " add %sp," __S(STACK_BIAS) "+22*8,%o0\n" \
572 " /* FALLTHRU */\n" \
573 " .size _start, .-_start\n" \
574 "\n" \
575 " .global _dl_start_user\n" \
576 " .type _dl_start_user, @function\n" \
577 "_dl_start_user:\n" \
578 " /* Load the GOT register. */\n" \
579 "1: call 11f\n" \
580 " sethi %hi(_GLOBAL_OFFSET_TABLE_-(1b-.)), %l7\n" \
581 "11: or %l7, %lo(_GLOBAL_OFFSET_TABLE_-(1b-.)), %l7\n" \
582 " /* Store the highest stack address. */\n" \
583 " sethi %hi(__libc_stack_end), %g5\n" \
584 " add %l7, %o7, %l7\n" \
585 " or %g5, %lo(__libc_stack_end), %g5\n" \
586 " /* Save the user entry point address in %l0. */\n" \
587 " mov %o0, %l0\n" \
588 " ldx [%l7 + %g5], %l1\n" \
589 " sethi %hi(_dl_skip_args), %g5\n" \
590 " add %sp, 6*8, %l2\n" \
591 " /* See if we were run as a command with the executable file name as an\n" \
592 " extra leading argument. If so, we must shift things around since we\n" \
593 " must keep the stack doubleword aligned. */\n" \
594 " or %g5, %lo(_dl_skip_args), %g5\n" \
595 " stx %l2, [%l1]\n" \
596 " ldx [%l7 + %g5], %i0\n" \
597 " ld [%i0], %i0\n" \
598 " brz,pt %i0, 2f\n" \
599 " ldx [%sp + " __S(STACK_BIAS) " + 22*8], %i5\n" \
600 " /* Find out how far to shift. */\n" \
601 " sethi %hi(_dl_argv), %l4\n" \
602 " sub %i5, %i0, %i5\n" \
603 " or %l4, %lo(_dl_argv), %l4\n" \
604 " sllx %i0, 3, %l6\n" \
605 " ldx [%l7 + %l4], %l4\n" \
606 " stx %i5, [%sp + " __S(STACK_BIAS) " + 22*8]\n" \
607 " add %sp, " __S(STACK_BIAS) " + 23*8, %i1\n" \
608 " add %i1, %l6, %i2\n" \
609 " ldx [%l4], %l5\n" \
610 " /* Copy down argv. */\n" \
611 "12: ldx [%i2], %i3\n" \
612 " add %i2, 8, %i2\n" \
613 " stx %i3, [%i1]\n" \
614 " brnz,pt %i3, 12b\n" \
615 " add %i1, 8, %i1\n" \
616 " sub %l5, %l6, %l5\n" \
617 " /* Copy down envp. */\n" \
618 "13: ldx [%i2], %i3\n" \
619 " add %i2, 8, %i2\n" \
620 " stx %i3, [%i1]\n" \
621 " brnz,pt %i3, 13b\n" \
622 " add %i1, 8, %i1\n" \
623 " /* Copy down auxiliary table. */\n" \
624 "14: ldx [%i2], %i3\n" \
625 " ldx [%i2 + 8], %i4\n" \
626 " add %i2, 16, %i2\n" \
627 " stx %i3, [%i1]\n" \
628 " stx %i4, [%i1 + 8]\n" \
629 " brnz,pt %i3, 14b\n" \
630 " add %i1, 16, %i1\n" \
631 " stx %l5, [%l4]\n" \
632 " /* %o0 = _dl_loaded, %o1 = argc, %o2 = argv, %o3 = envp. */\n" \
633 "2: sethi %hi(_dl_loaded), %o0\n" \
634 " add %sp, " __S(STACK_BIAS) " + 23*8, %o2\n" \
635 " orcc %o0, %lo(_dl_loaded), %o0\n" \
636 " sllx %i5, 3, %o3\n" \
637 " ldx [%l7 + %o0], %o0\n" \
638 " add %o3, 8, %o3\n" \
639 " mov %i5, %o1\n" \
640 " add %o2, %o3, %o3\n" \
641 " call _dl_init\n" \
642 " ldx [%o0], %o0\n" \
643 " /* Pass our finalizer function to the user in %g1. */\n" \
644 " sethi %hi(_dl_fini), %g1\n" \
645 " or %g1, %lo(_dl_fini), %g1\n" \
646 " ldx [%l7 + %g1], %g1\n" \
647 " /* Jump to the user's entry point and deallocate the extra stack we got. */\n" \
648 " jmp %l0\n" \
649 " add %sp, 6*8, %sp\n" \
650 " .size _dl_start_user, . - _dl_start_user\n" \
651 " .previous\n");