/*      $NetBSD: rtld_start.S,v 1.4 2001/09/26 04:06:43 mycroft Exp $   */

/*-
 * Copyright (C) 1998   Tsubai Masanari
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. The name of the author may not be used to endorse or promote products
 *    derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

/*
 * Syntax/target: GNU as, 32-bit PowerPC, preprocessed with cpp (.S file).
 * Both C-style comments and `#' end-of-line comments are used below.
 */

#include <machine/asm.h>
#include <machine/spr.h>	/* For SPR_SPEFSCR if needed. */

.extern _GLOBAL_OFFSET_TABLE_
.extern _DYNAMIC

/*
 * .rtld_start()
 *
 * Entry point of the run-time linker.  Self-relocates ld-elf.so, calls
 * _rtld() to load the program, then calls the program entry point that
 * _rtld() returned.  If that entry point ever returns, system call
 * number 1 (_exit) is issued.
 *
 * In:	%r3 = argc, %r4 = argv, %r5 = envp, %r8 = ps_strings
 *	(%r6 and %r7 are not saved; they are noted as always 0 on entry)
 *
 * 48-byte frame layout (offsets from the new %r1):
 *	 0	back chain (written by stwu)
 *	 4	lr save word
 *	 8	exit_proc	(filled in by _rtld)
 *	12	obj_main	(filled in by _rtld)
 *	16	argc
 *	20	argv
 *	24	envp
 *	28	obj		(slot reserved, store commented out)
 *	32	cleanup		(slot reserved, store commented out)
 *	36	ps_strings
 */
_ENTRY(.rtld_start)
	stwu	%r1,-48(%r1)	/* 16-byte aligned stack for reg saves +
				exit_proc & obj _rtld args +
				backchain & lrsave stack frame */
	stw	%r3,16(%r1)	/*  argc */
	stw	%r4,20(%r1)	/*  argv */
	stw	%r5,24(%r1)	/*  envp */
/*	stw	%r6,28(%r1)   *//*  obj (always 0) */
/*	stw	%r7,32(%r1)   *//*  cleanup (always 0) */
	stw	%r8,36(%r1)	/*  ps_strings */

	/*
	 * Perform initial relocation of ld-elf.so. Not as easy as it
	 * sounds.
	 *  - perform small forward branch to put PC into link reg
	 *  - use link-time constants to determine offset to the
	 *    _DYNAMIC section and the GOT. Add these to the PC to
	 *    convert to absolute addresses.
	 *  - read GOT[0], which is the SVR4 ABI-specified link-time
	 *    value of _DYNAMIC. Subtract this value from the absolute
	 *    value to determine the load address
	 *  - call reloc_non_plt_self() to fix up ld-elf.so's relocations
	 */
	bcl	20,31,1f
1:	mflr	%r30
	mr	%r3,%r30		# save for _DYNAMIC
	addis	%r30,%r30,_GLOBAL_OFFSET_TABLE_-1b@ha
	addi	%r30,%r30,_GLOBAL_OFFSET_TABLE_-1b@l
	addis	%r3,%r3,_DYNAMIC-1b@ha	# get _DYNAMIC actual address
	addi	%r3,%r3,_DYNAMIC-1b@l
	lwz	%r28,0(%r30)		# get base-relative &_DYNAMIC
	sub	%r28,%r3,%r28		# r28 = relocbase
	mr	%r4,%r28		# r4 = relocbase
	bl	reloc_non_plt_self /* reloc_non_plt_self(&_DYNAMIC,base) */

	/*
	 * The _rtld() function likes to see a stack layout containing
	 * { argc, argv[0], argv[1] ... argv[N], 0, env[0], ... , env[N] }
	 * Since the PowerPC stack was 16-byte aligned at exec time, the
	 * original stack layout has to be found by moving back a word
	 * from the argv pointer.
	 */
	lwz	%r4,20(%r1)	/* restore argv */
	addi	%r3,%r4,-4	/* locate argc ptr, &argv[-1] */

	addi	%r4,%r1,8	/* &exit_proc on stack */
	addi	%r5,%r1,12	/* &obj_main on stack */

	bl	_rtld		/* &_start = _rtld(sp, &exit_proc, &obj_main)*/
	mtlr	%r3		/* program entry point; called via blrl below */

	/*
	 * Restore args, with new obj/exit proc
	 */
	lwz	%r3,16(%r1)	/* argc */
	lwz	%r4,20(%r1)	/* argv */
	lwz	%r5,24(%r1)	/* envp */
	lwz	%r6,12(%r1)	/* obj */
	lwz	%r7,8(%r1)	/* exit proc */
	lwz	%r8,36(%r1)	/* ps_strings */
	addi	%r1,%r1,48	/* restore original stackptr */

	blrl	/* _start(argc, argv, envp, obj, cleanup, ps_strings) */

	li	%r0,1		/* _exit() */
	sc
_END(.rtld_start)

/*
 * Frame geometry shared by _rtld_bind_secureplt_start() and
 * _rtld_bind_start().
 *
 * Save-area layout used by the code below (offsets from the new %r1):
 *
 *   non-SPE:	12 = cr, 16 = lr, 20 = r0, 24.. = r3-r31 (stmw)
 *   SPE:	12 = cr, 16 = lr, 20 = SPEFSCR, 24 = r0 (64-bit),
 *		32 + 8 * (n - 3) = rN for N = 3..31 (64-bit each),
 *		264 = accumulator (64-bit)
 */
#ifdef __SPE__
/* stack space for 30 GPRs + SPEFSCR/ACC/lr/cr */
#define	NREGS		31
#define	GPRWIDTH	8
#define	FUDGE		4	/* Fudge factor for alignment */
#else
/* stack space for 30 GPRs + lr/cr */
#define	NREGS		30
#define	GPRWIDTH	4
#define	FUDGE		4
#endif
/* Stack frame needs the 12-byte ABI frame plus fudge factor. */
#define	STACK_SIZE	(NREGS * GPRWIDTH + 4 * 2 + 12 + FUDGE)

/*
 * _rtld_bind_secureplt_start()
 *
 * Call into the MI binder (Secure-PLT stub).
 * secure-plt expects %r11 to be the offset to the rela entry.
 * bss-plt expects %r11 to be index of the rela entry.
 * So for bss-plt, we multiply the index by 12 to get the offset.
 *
 * This stub therefore converts the incoming offset in %r11 into an index
 * (offset / 12) and then joins the common path inside _rtld_bind_start(),
 * which multiplies the index by 12 again before calling _rtld_bind().
 *
 * In:	%r11 = offset of the rela entry, %r12 = ELF object pointer
 *	(%r12 is passed through untouched to the common path)
 */
_ENTRY(_rtld_bind_secureplt_start)
	stwu	%r1,-STACK_SIZE(%r1)
#ifdef __SPE__
	evstdd	%r0,24(%r1)
#else
	stw	%r0,20(%r1)	# save r0
#endif

	/*
	 * Instead of division which is costly we will use multiplicative
	 * inverse.  a / n = ((a * inv(n)) >> 32)
	 * where inv(n) = (0x100000000 + n - 1) / n
	 */
	mr	%r0,%r11
	lis	%r11,0x15555556@h	# load multiplicative inverse of 12
	ori	%r11,%r11,0x15555556@l
	mulhwu	%r11,%r11,%r0		# get high half of multiplication
	b	.Lrtld_bind_common	/* frame and r0 already set up above */
_END(_rtld_bind_secureplt_start)

/*
 * _rtld_bind_start()
 *
 * Call into the MI binder. This routine is reached via the PLT call cell,
 * and then _rtld_powerpc_pltresolve().
 * On entry, %r11 contains the index of the PLT cell, and %r12 contains
 * a pointer to the ELF object for the file.
 * Save all registers, call into the binder to resolve and fixup the external
 * routine, and then transfer to the external routine on return.
 *
 * The address returned by _rtld_bind() is kept in ctr across the register
 * restore, so every GPR, lr and cr (plus SPEFSCR and the accumulator on
 * SPE) hold their entry values again when the target is entered.
 */
	.globl  _rtld_bind

_ENTRY(_rtld_bind_start)
	stwu	%r1,-STACK_SIZE(%r1)
#ifdef __SPE__
	evstdd	%r0,24(%r1)
#else
	stw	%r0,20(%r1)	# save r0
#endif
	/*
	 * Common path; _rtld_bind_secureplt_start() branches here after
	 * creating an identical frame and saving r0 itself.
	 */
.Lrtld_bind_common:
	mflr	%r0
	stw	%r0,16(%r1)	# save lr
	mfcr	%r0
	stw	%r0,12(%r1)	# save cr
#ifdef __SPE__
	evstdd	%r3, 32(%r1)
	evstdd	%r4, 40(%r1)
	evstdd	%r5, 48(%r1)
	evstdd	%r6, 56(%r1)
	evstdd	%r7, 64(%r1)
	evstdd	%r8, 72(%r1)
	evstdd	%r9, 80(%r1)
	evstdd	%r10, 88(%r1)
	evstdd	%r11, 96(%r1)
	evstdd	%r12, 104(%r1)
	evstdd	%r13, 112(%r1)
	evstdd	%r14, 120(%r1)
	evstdd	%r15, 128(%r1)
	evstdd	%r16, 136(%r1)
	evstdd	%r17, 144(%r1)
	evstdd	%r18, 152(%r1)
	evstdd	%r19, 160(%r1)
	evstdd	%r20, 168(%r1)
	evstdd	%r21, 176(%r1)
	evstdd	%r22, 184(%r1)
	evstdd	%r23, 192(%r1)
	evstdd	%r24, 200(%r1)
	evstdd	%r25, 208(%r1)
	evstdd	%r26, 216(%r1)
	evstdd	%r27, 224(%r1)
	evstdd	%r28, 232(%r1)
	evstdd	%r29, 240(%r1)
	evstdd	%r30, 248(%r1)
	/*
	 * Offsets 256 and 264 use the indexed form with the offset in a
	 * scratch register (r3 is already saved above).
	 * NOTE(review): presumably these exceed the immediate displacement
	 * range of evstdd/evldd -- confirm against the SPE manual.
	 */
	li	%r3, 256
	evstddx	%r31, %r1, %r3
	/* Read the accumulator into r0 by accumulating 0 * 0 into it. */
	evxor	%r0, %r0, %r0
	li	%r3, 264
	evmwumiaa %r0, %r0, %r0
	evstddx	%r0, %r1, %r3
	mfspr	%r3, SPR_SPEFSCR
	stw	%r3, 20(%r1)
#else
	stmw	%r3,24(%r1)	# save r3-r31
#endif

	mr	%r3,%r12	# obj
	mulli	%r4,%r11,12	# rela index * sizeof(Elf_Rela)
	bl	_rtld_bind	# target addr = _rtld_bind(obj, reloff)
	mtctr	%r3		# move absolute target addr into ctr

#ifdef __SPE__
	lwz	%r3, 20(%r1)
	mtspr	SPR_SPEFSCR, %r3
	li	%r3, 264
	evlddx	%r0, %r3, %r1
	evmra	%r0, %r0	/* reload the saved accumulator */
	evldd	%r3, 32(%r1)
	evldd	%r4, 40(%r1)
	evldd	%r5, 48(%r1)
	evldd	%r6, 56(%r1)
	evldd	%r7, 64(%r1)
	evldd	%r8, 72(%r1)
	evldd	%r9, 80(%r1)
	evldd	%r10, 88(%r1)
	evldd	%r11, 96(%r1)
	evldd	%r12, 104(%r1)
	evldd	%r13, 112(%r1)
	evldd	%r14, 120(%r1)
	evldd	%r15, 128(%r1)
	evldd	%r16, 136(%r1)
	evldd	%r17, 144(%r1)
	evldd	%r18, 152(%r1)
	evldd	%r19, 160(%r1)
	evldd	%r20, 168(%r1)
	evldd	%r21, 176(%r1)
	evldd	%r22, 184(%r1)
	evldd	%r23, 192(%r1)
	evldd	%r24, 200(%r1)
	evldd	%r25, 208(%r1)
	evldd	%r26, 216(%r1)
	evldd	%r27, 224(%r1)
	evldd	%r28, 232(%r1)
	evldd	%r29, 240(%r1)
	evldd	%r30, 248(%r1)
	li	%r0, 256	/* r0 is free: it is reloaded last, below */
	evlddx	%r31, %r1, %r0
#else
	lmw	%r3,24(%r1)	# restore r3-r31
#endif
	lwz	%r0,12(%r1)	# restore cr
	mtcr	%r0
	lwz	%r0,16(%r1)	# restore lr
	mtlr	%r0
#ifdef __SPE__
	evldd	%r0,24(%r1)
#else
	lwz	%r0,20(%r1)	# restore r0
#endif

	addi	%r1,%r1,STACK_SIZE	# restore stack
	bctr			# jump to target
_END(_rtld_bind_start)


/*
 * _rtld_powerpc_pltresolve()
 *
 * This routine is copied into the latter part of the 72-byte reserved
 * area at the start of the PLT. The absolute address of the _rtld_bind_start
 * routine, and the ELF object for the loaded file, are inserted into
 * the code by the reloc.c:init_pltgot() routine.
 * The first time an external routine is called, the PLT slot will
 * set up %r11 to the offset of the slot, and will jump to this routine.
 * A pointer to the ELF object is loaded into %r12, and _rtld_bind_start
 * is called to complete the binding.
 *
 * The zero immediates in the lis/addi pairs below are placeholders; the
 * comment on each instruction shows the operand that gets patched in.
 *
 * _rtld_powerpc_pltlongresolve() is a prefix stub: it subtracts the
 * patched-in jmptab address from %r11 and shifts the result right by 2
 * to turn it into an index.  It contains no branch of its own.
 * NOTE(review): presumably it is copied directly in front of the
 * _rtld_powerpc_pltresolve code and runs into it -- confirm against
 * reloc.c:init_pltgot().
 */
_ENTRY(_rtld_powerpc_pltlongresolve)
	lis	%r12,0			# lis	12,jmptab@ha
	addi	%r12,%r12,0		# addi	12,12,jmptab@l
	subf	%r11,%r12,%r11		# reloff
	li	%r12,2
	srw	%r11,%r11,%r12		# index = reloff/sizeof(Elf_Addr)
_END(_rtld_powerpc_pltlongresolve)
_ENTRY(_rtld_powerpc_pltresolve)
	lis	%r12,0			# lis	12,_rtld_bind_start@ha
	addi	%r12,%r12,0		# addi	12,12,_rtld_bind_start@l
	mtctr	%r12
	lis	%r12,0			# lis	12,obj@ha
	addi	%r12,%r12,0		# addi	12,12,obj@l
	bctr
_END(_rtld_powerpc_pltresolve)

/*
 * _rtld_powerpc_pltcall()
 *
 * This routine is copied into the 72-byte reserved area at the
 * start of the PLT. The reloc.c:init_pltgot() routine inserts
 * the absolute address of the jumptable.
 * Control is transferred to this routine when the binder has
 * located the external routine, but determined that it is > 32Mb
 * from the PLT slot. Code is inserted into the PLT slot to set up
 * %r11 with the jumptable index, and jump to here, where the
 * absolute address of the external routine is loaded from the
 * jumptable and transferred to.
 *
 * In:	%r11 = jumptable index
 * Clobbers: %r11, ctr
 */
_ENTRY(_rtld_powerpc_pltcall)
	slwi	%r11,%r11,2		# jmptab offset = index * 4
	addis	%r11,%r11,0		# addis	11,11,jmptab@ha
	lwz	%r11,0(%r11)		# lwz	11,jmptab@l(11)
	mtctr	%r11
	bctr				# (*jmptab[index])()
_END(_rtld_powerpc_pltcall)

	.section .note.GNU-stack,"",%progbits