1 /* 2 * FP/SIMD state saving and restoring macros 3 * 4 * Copyright (C) 2012 ARM Ltd. 5 * Author: Catalin Marinas <catalin.marinas@arm.com> 6 * 7 * This program is free software; you can redistribute it and/or modify 8 * it under the terms of the GNU General Public License version 2 as 9 * published by the Free Software Foundation. 10 * 11 * This program is distributed in the hope that it will be useful, 12 * but WITHOUT ANY WARRANTY; without even the implied warranty of 13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 14 * GNU General Public License for more details. 15 * 16 * You should have received a copy of the GNU General Public License 17 * along with this program. If not, see <http://www.gnu.org/licenses/>. 18 */ 19 20 .macro fpsimd_save state, tmpnr 21 stp q0, q1, [\state, #16 * 0] 22 stp q2, q3, [\state, #16 * 2] 23 stp q4, q5, [\state, #16 * 4] 24 stp q6, q7, [\state, #16 * 6] 25 stp q8, q9, [\state, #16 * 8] 26 stp q10, q11, [\state, #16 * 10] 27 stp q12, q13, [\state, #16 * 12] 28 stp q14, q15, [\state, #16 * 14] 29 stp q16, q17, [\state, #16 * 16] 30 stp q18, q19, [\state, #16 * 18] 31 stp q20, q21, [\state, #16 * 20] 32 stp q22, q23, [\state, #16 * 22] 33 stp q24, q25, [\state, #16 * 24] 34 stp q26, q27, [\state, #16 * 26] 35 stp q28, q29, [\state, #16 * 28] 36 stp q30, q31, [\state, #16 * 30]! 37 mrs x\tmpnr, fpsr 38 str w\tmpnr, [\state, #16 * 2] 39 mrs x\tmpnr, fpcr 40 str w\tmpnr, [\state, #16 * 2 + 4] 41 .endm 42 43 .macro fpsimd_restore_fpcr state, tmp 44 /* 45 * Writes to fpcr may be self-synchronising, so avoid restoring 46 * the register if it hasn't changed. 47 */ 48 mrs \tmp, fpcr 49 cmp \tmp, \state 50 b.eq 9999f 51 msr fpcr, \state 52 9999: 53 .endm 54 55 /* Clobbers \state */ 56 .macro fpsimd_restore state, tmpnr 57 ldp q0, q1, [\state, #16 * 0] 58 ldp q2, q3, [\state, #16 * 2] 59 ldp q4, q5, [\state, #16 * 4] 60 ldp q6, q7, [\state, #16 * 6] 61 ldp q8, q9, [\state, #16 * 8] 62 ldp q10, q11, [\state, #16 * 10] 63 ldp q12, q13, [\state, #16 * 12] 64 ldp q14, q15, [\state, #16 * 14] 65 ldp q16, q17, [\state, #16 * 16] 66 ldp q18, q19, [\state, #16 * 18] 67 ldp q20, q21, [\state, #16 * 20] 68 ldp q22, q23, [\state, #16 * 22] 69 ldp q24, q25, [\state, #16 * 24] 70 ldp q26, q27, [\state, #16 * 26] 71 ldp q28, q29, [\state, #16 * 28] 72 ldp q30, q31, [\state, #16 * 30]! 73 ldr w\tmpnr, [\state, #16 * 2] 74 msr fpsr, x\tmpnr 75 ldr w\tmpnr, [\state, #16 * 2 + 4] 76 fpsimd_restore_fpcr x\tmpnr, \state 77 .endm 78 79 /* Sanity-check macros to help avoid encoding garbage instructions */ 80 81 .macro _check_general_reg nr 82 .if (\nr) < 0 || (\nr) > 30 83 .error "Bad register number \nr." 84 .endif 85 .endm 86 87 .macro _sve_check_zreg znr 88 .if (\znr) < 0 || (\znr) > 31 89 .error "Bad Scalable Vector Extension vector register number \znr." 90 .endif 91 .endm 92 93 .macro _sve_check_preg pnr 94 .if (\pnr) < 0 || (\pnr) > 15 95 .error "Bad Scalable Vector Extension predicate register number \pnr." 96 .endif 97 .endm 98 99 .macro _check_num n, min, max 100 .if (\n) < (\min) || (\n) > (\max) 101 .error "Number \n out of range [\min,\max]" 102 .endif 103 .endm 104 105 /* SVE instruction encodings for non-SVE-capable assemblers */ 106 107 /* STR (vector): STR Z\nz, [X\nxbase, #\offset, MUL VL] */ 108 .macro _sve_str_v nz, nxbase, offset=0 109 _sve_check_zreg \nz 110 _check_general_reg \nxbase 111 _check_num (\offset), -0x100, 0xff 112 .inst 0xe5804000 \ 113 | (\nz) \ 114 | ((\nxbase) << 5) \ 115 | (((\offset) & 7) << 10) \ 116 | (((\offset) & 0x1f8) << 13) 117 .endm 118 119 /* LDR (vector): LDR Z\nz, [X\nxbase, #\offset, MUL VL] */ 120 .macro _sve_ldr_v nz, nxbase, offset=0 121 _sve_check_zreg \nz 122 _check_general_reg \nxbase 123 _check_num (\offset), -0x100, 0xff 124 .inst 0x85804000 \ 125 | (\nz) \ 126 | ((\nxbase) << 5) \ 127 | (((\offset) & 7) << 10) \ 128 | (((\offset) & 0x1f8) << 13) 129 .endm 130 131 /* STR (predicate): STR P\np, [X\nxbase, #\offset, MUL VL] */ 132 .macro _sve_str_p np, nxbase, offset=0 133 _sve_check_preg \np 134 _check_general_reg \nxbase 135 _check_num (\offset), -0x100, 0xff 136 .inst 0xe5800000 \ 137 | (\np) \ 138 | ((\nxbase) << 5) \ 139 | (((\offset) & 7) << 10) \ 140 | (((\offset) & 0x1f8) << 13) 141 .endm 142 143 /* LDR (predicate): LDR P\np, [X\nxbase, #\offset, MUL VL] */ 144 .macro _sve_ldr_p np, nxbase, offset=0 145 _sve_check_preg \np 146 _check_general_reg \nxbase 147 _check_num (\offset), -0x100, 0xff 148 .inst 0x85800000 \ 149 | (\np) \ 150 | ((\nxbase) << 5) \ 151 | (((\offset) & 7) << 10) \ 152 | (((\offset) & 0x1f8) << 13) 153 .endm 154 155 /* RDVL X\nx, #\imm */ 156 .macro _sve_rdvl nx, imm 157 _check_general_reg \nx 158 _check_num (\imm), -0x20, 0x1f 159 .inst 0x04bf5000 \ 160 | (\nx) \ 161 | (((\imm) & 0x3f) << 5) 162 .endm 163 164 /* RDFFR (unpredicated): RDFFR P\np.B */ 165 .macro _sve_rdffr np 166 _sve_check_preg \np 167 .inst 0x2519f000 \ 168 | (\np) 169 .endm 170 171 /* WRFFR P\np.B */ 172 .macro _sve_wrffr np 173 _sve_check_preg \np 174 .inst 0x25289000 \ 175 | ((\np) << 5) 176 .endm 177 178 .macro __for from:req, to:req 179 .if (\from) == (\to) 180 _for__body \from 181 .else 182 __for \from, (\from) + ((\to) - (\from)) / 2 183 __for (\from) + ((\to) - (\from)) / 2 + 1, \to 184 .endif 185 .endm 186 187 .macro _for var:req, from:req, to:req, insn:vararg 188 .macro _for__body \var:req 189 \insn 190 .endm 191 192 __for \from, \to 193 194 .purgem _for__body 195 .endm 196 197 .macro sve_save nxbase, xpfpsr, nxtmp 198 _for n, 0, 31, _sve_str_v \n, \nxbase, \n - 34 199 _for n, 0, 15, _sve_str_p \n, \nxbase, \n - 16 200 _sve_rdffr 0 201 _sve_str_p 0, \nxbase 202 _sve_ldr_p 0, \nxbase, -16 203 204 mrs x\nxtmp, fpsr 205 str w\nxtmp, [\xpfpsr] 206 mrs x\nxtmp, fpcr 207 str w\nxtmp, [\xpfpsr, #4] 208 .endm 209 210 .macro sve_load nxbase, xpfpsr, xvqminus1, nxtmp 211 mrs_s x\nxtmp, SYS_ZCR_EL1 212 bic x\nxtmp, x\nxtmp, ZCR_ELx_LEN_MASK 213 orr x\nxtmp, x\nxtmp, \xvqminus1 214 msr_s SYS_ZCR_EL1, x\nxtmp // self-synchronising 215 216 _for n, 0, 31, _sve_ldr_v \n, \nxbase, \n - 34 217 _sve_ldr_p 0, \nxbase 218 _sve_wrffr 0 219 _for n, 0, 15, _sve_ldr_p \n, \nxbase, \n - 16 220 221 ldr w\nxtmp, [\xpfpsr] 222 msr fpsr, x\nxtmp 223 ldr w\nxtmp, [\xpfpsr, #4] 224 msr fpcr, x\nxtmp 225 .endm 226