/* xref: /freebsd/libexec/rtld-elf/powerpc/rtld_start.S (revision edf8578117e8844e02c0121147f45e4609b30680) */
/*      $NetBSD: rtld_start.S,v 1.4 2001/09/26 04:06:43 mycroft Exp $   */

/*-
 * Copyright (C) 1998   Tsubai Masanari
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. The name of the author may not be used to endorse or promote products
 *    derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include <machine/asm.h>
#include <machine/spr.h>	/* For SPR_SPEFSCR if needed. */

/* Link-time symbols used by .rtld_start to locate the GOT and _DYNAMIC. */
.extern _GLOBAL_OFFSET_TABLE_
.extern _DYNAMIC

/*
 * .rtld_start
 *
 * Start-up stub for ld-elf.so: saves the incoming arguments,
 * self-relocates the runtime linker, calls _rtld() and then calls the
 * address returned by _rtld() with the saved arguments.
 *
 * On entry (as saved below): %r3 = argc, %r4 = argv, %r5 = envp,
 * %r8 = ps_strings.  %r6 (obj) and %r7 (cleanup) are always 0 on entry
 * and are not saved.
 *
 * 48-byte frame, offsets from the new %r1:
 *	 0	backchain (written by stwu)
 *	 4	lrsave
 *	 8	exit_proc, written by _rtld()
 *	12	obj_main, written by _rtld()
 *	16	argc
 *	20	argv
 *	24	envp
 *	28	obj (slot reserved, never written)
 *	32	cleanup (slot reserved, never written)
 *	36	ps_strings
 */
_ENTRY(.rtld_start)
	stwu	%r1,-48(%r1)	/* 16-byte aligned stack for reg saves +
				   exit_proc & obj _rtld args +
				   backchain & lrsave stack frame */
	stw	%r3,16(%r1)	/* argc */
	stw	%r4,20(%r1)	/* argv */
	stw	%r5,24(%r1)	/* envp */
/*	stw	%r6,28(%r1)   *//* obj (always 0) */
/*	stw	%r7,32(%r1)   *//* cleanup (always 0) */
	stw	%r8,36(%r1)	/* ps_strings */

	/*
	 * Perform initial relocation of ld-elf.so. Not as easy as it
	 * sounds.
	 *  - perform small forward branch to put PC into link reg
	 *  - use link-time constants to determine offset to the
	 *    _DYNAMIC section and the GOT. Add these to the PC to
	 *    convert to absolute addresses.
	 *  - read GOT[0], which is the SVR4 ABI-specified link-time
	 *    value of _DYNAMIC. Subtract this value from the absolute
	 *    value to determine the load address
	 *  - call reloc_non_plt_self() to fix up ld-elf.so's relocations
	 */
	bcl	20,31,1f		/* branch-and-link to the next insn */
1:	mflr	%r30			/* r30 = run-time address of label 1 */
	mr	%r3,%r30		/* keep a copy for _DYNAMIC */
	addis	%r30,%r30,_GLOBAL_OFFSET_TABLE_-1b@ha
	addi	%r30,%r30,_GLOBAL_OFFSET_TABLE_-1b@l	/* r30 = actual &GOT */
	addis	%r3,%r3,_DYNAMIC-1b@ha
	addi	%r3,%r3,_DYNAMIC-1b@l	/* r3 = actual &_DYNAMIC */
	lwz	%r28,0(%r30)		/* GOT[0] = base-relative &_DYNAMIC */
	sub	%r28,%r3,%r28		/* r28 = relocbase */
	mr	%r4,%r28		/* r4 = relocbase */
	bl	reloc_non_plt_self /* reloc_non_plt_self(&_DYNAMIC,base) */

	/*
	 * The _rtld() function likes to see a stack layout containing
	 * { argc, argv[0], argv[1] ... argv[N], 0, env[0], ... , env[N] }
	 * Since the PowerPC stack was 16-byte aligned at exec time, the
	 * original stack layout has to be found by moving back a word
	 * from the argv pointer.
	 */
	lwz	%r4,20(%r1)	/* reload the saved argv */
	addi	%r3,%r4,-4	/* locate argc ptr, &argv[-1] */

	addi	%r4,%r1,8	/* &exit_proc on stack */
	addi	%r5,%r1,12	/* &obj_main on stack */

	bl	_rtld		/* &_start = _rtld(sp, &exit_proc, &obj_main) */
	mtlr	%r3		/* returned entry address, called via blrl */

	/*
	 * Restore args, with new obj/exit proc
	 */
	lwz	%r3,16(%r1)	/* argc */
	lwz	%r4,20(%r1)	/* argv */
	lwz	%r5,24(%r1)	/* envp */
	lwz	%r6,12(%r1)	/* obj, as stored by _rtld() */
	lwz	%r7,8(%r1)	/* exit proc, as stored by _rtld() */
	lwz	%r8,36(%r1)	/* ps_strings */
	addi	%r1,%r1,48	/* restore original stackptr */

	blrl	/* _start(argc, argv, envp, obj, cleanup, ps_strings) */

	/* Only reached if the call above returns. */
	li	%r0,1		/* _exit() */
	sc
_END(.rtld_start)

/*
 * Frame geometry used by _rtld_bind_secureplt_start and _rtld_bind_start.
 * STACK_SIZE evaluates to 272 bytes with __SPE__ and 144 bytes without;
 * both are multiples of 16.
 */
#ifdef __SPE__
/* stack space for 30 GPRs + SPEFSCR/ACC/lr/cr */
#define	NREGS		31
#define	GPRWIDTH	8	/* registers are saved as 64-bit values */
#define	FUDGE		4	/* Fudge factor for alignment */
#else
/* stack space for 30 GPRs + lr/cr */
#define	NREGS		30
#define	GPRWIDTH	4
#define	FUDGE		4
#endif
/* Stack frame needs the 12-byte ABI frame plus fudge factor. */
#define	STACK_SIZE	(NREGS * GPRWIDTH + 4 * 2 + 12 + FUDGE)

/*
 * _rtld_bind_secureplt_start()
 *
 * Call into the MI binder (Secure-PLT stub).
 * secure-plt supplies %r11 as the byte offset of the rela entry, while
 * the common path in _rtld_bind_start takes %r11 as the index of the
 * rela entry and multiplies it by 12 to get the offset.
 * This stub therefore allocates the same frame as _rtld_bind_start,
 * saves %r0, divides the offset in %r11 by 12 and joins
 * _rtld_bind_start at its local label 1.
 */
_ENTRY(_rtld_bind_secureplt_start)
	stwu	%r1,-STACK_SIZE(%r1)
#ifdef __SPE__
	evstdd	%r0,24(%r1)		/* save r0 (64-bit) */
#else
	stw	%r0,20(%r1)		/* save r0 */
#endif

	/*
	 * Instead of division which is costly we will use multiplicative
	 * inverse.  a / n = ((a * inv(n)) >> 32)
	 * where inv(n) = (0x100000000 + n - 1) / n
	 * For n = 12 this gives 0x15555556.
	 * NOTE(review): the rounded-up inverse is exact only for a limited
	 * range of a; presumably rela offsets stay far below that limit.
	 */
	mr	%r0,%r11		/* r0 = rela offset */
	lis	%r11,0x15555556@h	/* load multiplicative inverse of 12 */
	ori	%r11,%r11,0x15555556@l
	mulhwu	%r11,%r11,%r0		/* high half of product = offset / 12 */
	b	1f			/* continue at label 1 in _rtld_bind_start */
_END(_rtld_bind_secureplt_start)

/*
 * _rtld_bind_start()
 *
 * Call into the MI binder. This routine is reached via the PLT call cell,
 * and then _rtld_powerpc_pltresolve().
 * On entry, %r11 contains the index of the PLT cell, and %r12 contains
 * a pointer to the ELF object for the file.
 *  Save all registers, call into the binder to resolve and fixup the external
 * routine, and then transfer to the external routine on return.
 *
 * Save area, offsets from the new %r1:
 *	12	cr
 *	16	lr
 *	20	r0 (non-SPE) or SPEFSCR (SPE)
 *	24	r3-r31 as words (non-SPE) or 64-bit r0 (SPE)
 *	32	64-bit r3-r31 (SPE only; r31 ends up at 256)
 *	264	accumulator (SPE only)
 *
 * Local label 1 is also the join point for _rtld_bind_secureplt_start,
 * which arrives with the frame allocated and r0 already saved.
 */
	.globl  _rtld_bind

_ENTRY(_rtld_bind_start)
	stwu	%r1,-STACK_SIZE(%r1)
#ifdef __SPE__
	evstdd	%r0,24(%r1)		/* save r0 (64-bit) */
#else
	stw	%r0,20(%r1)		/* save r0 */
#endif
1:
	mflr	%r0
	stw	%r0,16(%r1)		/* save lr */
	mfcr	%r0
	stw	%r0,12(%r1)		/* save cr */
#ifdef __SPE__
	evstdd	%r3, 32(%r1)
	evstdd	%r4, 40(%r1)
	evstdd	%r5, 48(%r1)
	evstdd	%r6, 56(%r1)
	evstdd	%r7, 64(%r1)
	evstdd	%r8, 72(%r1)
	evstdd	%r9, 80(%r1)
	evstdd	%r10, 88(%r1)
	evstdd	%r11, 96(%r1)
	evstdd	%r12, 104(%r1)
	evstdd	%r13, 112(%r1)
	evstdd	%r14, 120(%r1)
	evstdd	%r15, 128(%r1)
	evstdd	%r16, 136(%r1)
	evstdd	%r17, 144(%r1)
	evstdd	%r18, 152(%r1)
	evstdd	%r19, 160(%r1)
	evstdd	%r20, 168(%r1)
	evstdd	%r21, 176(%r1)
	evstdd	%r22, 184(%r1)
	evstdd	%r23, 192(%r1)
	evstdd	%r24, 200(%r1)
	evstdd	%r25, 208(%r1)
	evstdd	%r26, 216(%r1)
	evstdd	%r27, 224(%r1)
	evstdd	%r28, 232(%r1)
	evstdd	%r29, 240(%r1)
	evstdd	%r30, 248(%r1)
	/* Offsets past 248 use the indexed form; r3 is already saved. */
	li	%r3, 256
	evstddx	%r31, %r1, %r3
	/* Read the accumulator: 0 * 0 + ACC lands in r0, then save it. */
	evxor	%r0, %r0, %r0
	li	%r3, 264
	evmwumiaa	%r0, %r0, %r0
	evstddx	%r0, %r1, %r3
	mfspr	%r3, SPR_SPEFSCR
	stw	%r3, 20(%r1)		/* save SPEFSCR */
#else
	stmw	%r3,24(%r1)		/* save r3-r31 */
#endif

	mr	%r3,%r12		/* obj */
	mulli	%r4,%r11,12		/* rela index * sizeof(Elf_Rela) */
	bl	_rtld_bind		/* target addr = _rtld_bind(obj, reloff) */
	mtctr	%r3			/* move absolute target addr into ctr */

#ifdef __SPE__
	lwz	%r3, 20(%r1)
	mtspr	SPR_SPEFSCR, %r3	/* restore SPEFSCR */
	li	%r3, 264
	evlddx	%r0, %r3, %r1
	evmra	%r0, %r0		/* restore the accumulator */
	evldd	%r3, 32(%r1)
	evldd	%r4, 40(%r1)
	evldd	%r5, 48(%r1)
	evldd	%r6, 56(%r1)
	evldd	%r7, 64(%r1)
	evldd	%r8, 72(%r1)
	evldd	%r9, 80(%r1)
	evldd	%r10, 88(%r1)
	evldd	%r11, 96(%r1)
	evldd	%r12, 104(%r1)
	evldd	%r13, 112(%r1)
	evldd	%r14, 120(%r1)
	evldd	%r15, 128(%r1)
	evldd	%r16, 136(%r1)
	evldd	%r17, 144(%r1)
	evldd	%r18, 152(%r1)
	evldd	%r19, 160(%r1)
	evldd	%r20, 168(%r1)
	evldd	%r21, 176(%r1)
	evldd	%r22, 184(%r1)
	evldd	%r23, 192(%r1)
	evldd	%r24, 200(%r1)
	evldd	%r25, 208(%r1)
	evldd	%r26, 216(%r1)
	evldd	%r27, 224(%r1)
	evldd	%r28, 232(%r1)
	evldd	%r29, 240(%r1)
	evldd	%r30, 248(%r1)
	li	%r0, 256		/* r0 is free until its own restore below */
	evlddx	%r31, %r1, %r0
#else
	lmw	%r3,24(%r1)		/* restore r3-r31 */
#endif
	lwz	%r0,12(%r1)		/* restore cr */
	mtcr	%r0
	lwz	%r0,16(%r1)		/* restore lr */
	mtlr	%r0
#ifdef __SPE__
	evldd	%r0,24(%r1)		/* restore r0 (64-bit) */
#else
	lwz	%r0,20(%r1)		/* restore r0 */
#endif

	addi	%r1,%r1,STACK_SIZE	/* restore stack */
	bctr				/* jump to target */
_END(_rtld_bind_start)


/*
 * _rtld_powerpc_pltlongresolve() / _rtld_powerpc_pltresolve()
 *
 *  _rtld_powerpc_pltresolve is copied into the latter part of the 72-byte
 * reserved area at the start of the PLT. The absolute address of the
 * _rtld_bind_start routine, and the ELF object for the loaded file, are
 * inserted into the code by the reloc.c:init_pltgot() routine; the zero
 * immediates below are the placeholders for those values.
 *  The first time an external routine is called, the PLT slot will
 * set up %r11 to the offset of the slot, and will jump to this routine.
 * The ELF object is loaded into %r12, and _rtld_bind_start is called
 * to complete the binding.
 *  _rtld_powerpc_pltlongresolve subtracts the patched-in jmptab address
 * from %r11 and shifts the result right by 2 to form the index. It has
 * no branch of its own, so it is presumably placed directly in front of
 * the _rtld_powerpc_pltresolve code when copied - confirm against
 * reloc.c.
 */
_ENTRY(_rtld_powerpc_pltlongresolve)
	lis	%r12,0			/* lis	12,jmptab@ha */
	addi	%r12,%r12,0		/* addi	12,12,jmptab@l */
	subf	%r11,%r12,%r11		/* reloff = r11 - jmptab */
	li	%r12,2
	srw	%r11,%r11,%r12		/* index = reloff/sizeof(Elf_Addr) */
_END(_rtld_powerpc_pltlongresolve)
_ENTRY(_rtld_powerpc_pltresolve)
	lis	%r12,0			/* lis	12,_rtld_bind_start@ha */
	addi	%r12,%r12,0		/* addi	12,12,_rtld_bind_start@l */
	mtctr	%r12			/* ctr = _rtld_bind_start */
	lis	%r12,0			/* lis	12,obj@ha */
	addi	%r12,%r12,0		/* addi	12,12,obj@l */
	bctr				/* enter _rtld_bind_start, r12 = obj */
_END(_rtld_powerpc_pltresolve)

/*
 * _rtld_powerpc_pltcall()
 *
 *  This routine is copied into the 72-byte reserved area at the
 * start of the PLT. The reloc.c:init_pltgot() routine inserts
 * the absolute address of the jumptable; the zero immediates below
 * are the placeholders for it.
 *  Control is transferred to this routine when the binder has
 * located the external routine, but determined that it is > 32MB
 * from the PLT slot. Code is inserted into the PLT slot to set up
 * %r11 with the jumptable index, and jump to here, where the
 * absolute address of the external routine is loaded from the
 * jumptable and control is transferred to it.
 */
_ENTRY(_rtld_powerpc_pltcall)
	slwi	%r11,%r11,2		/* jmptab offset = index * 4 */
	addis	%r11,%r11,0		/* addis 11,11,jmptab@ha */
	lwz	%r11,0(%r11)		/* lwz   11,jmptab@l(11) */
	mtctr	%r11
	bctr				/* (*jmptab[index])() */
_END(_rtld_powerpc_pltcall)

319	.section .note.GNU-stack,"",%progbits
320