Commit | Line | Data |
---|---|---|
0be7320a | 1 | /* |
7b7293ae | 2 | * Based on arch/arm/include/asm/assembler.h, arch/arm/mm/proc-macros.S |
0be7320a CM |
3 | * |
4 | * Copyright (C) 1996-2000 Russell King | |
5 | * Copyright (C) 2012 ARM Ltd. | |
6 | * | |
7 | * This program is free software; you can redistribute it and/or modify | |
8 | * it under the terms of the GNU General Public License version 2 as | |
9 | * published by the Free Software Foundation. | |
10 | * | |
11 | * This program is distributed in the hope that it will be useful, | |
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
14 | * GNU General Public License for more details. | |
15 | * | |
16 | * You should have received a copy of the GNU General Public License | |
17 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | |
18 | */ | |
19 | #ifndef __ASSEMBLY__ | |
20 | #error "Only include this from assembly code" | |
21 | #endif | |
22 | ||
f3e39273 MZ |
23 | #ifndef __ASM_ASSEMBLER_H |
24 | #define __ASM_ASSEMBLER_H | |
25 | ||
7b7293ae | 26 | #include <asm/asm-offsets.h> |
823066d9 | 27 | #include <asm/cpufeature.h> |
5003dbde | 28 | #include <asm/page.h> |
7b7293ae | 29 | #include <asm/pgtable-hwdef.h> |
0be7320a | 30 | #include <asm/ptrace.h> |
2a283070 | 31 | #include <asm/thread_info.h> |
0be7320a | 32 | |
0be7320a CM |
33 | /* |
34 | * Enable and disable interrupts. | |
35 | */ | |
36 | .macro disable_irq | |
37 | msr daifset, #2 | |
38 | .endm | |
39 | ||
40 | .macro enable_irq | |
41 | msr daifclr, #2 | |
42 | .endm | |
43 | ||
0be7320a CM |
44 | /* |
45 | * Enable and disable debug exceptions. | |
46 | */ | |
47 | .macro disable_dbg | |
48 | msr daifset, #8 | |
49 | .endm | |
50 | ||
51 | .macro enable_dbg | |
52 | msr daifclr, #8 | |
53 | .endm | |
54 | ||
2a283070 WD |
55 | .macro disable_step_tsk, flgs, tmp |
56 | tbz \flgs, #TIF_SINGLESTEP, 9990f | |
0be7320a CM |
57 | mrs \tmp, mdscr_el1 |
58 | bic \tmp, \tmp, #1 | |
59 | msr mdscr_el1, \tmp | |
2a283070 WD |
60 | isb // Synchronise with enable_dbg |
61 | 9990: | |
0be7320a CM |
62 | .endm |
63 | ||
2a283070 WD |
64 | .macro enable_step_tsk, flgs, tmp |
65 | tbz \flgs, #TIF_SINGLESTEP, 9990f | |
66 | disable_dbg | |
0be7320a CM |
67 | mrs \tmp, mdscr_el1 |
68 | orr \tmp, \tmp, #1 | |
69 | msr mdscr_el1, \tmp | |
2a283070 | 70 | 9990: |
0be7320a CM |
71 | .endm |
72 | ||
2a283070 WD |
73 | /* |
74 | * Enable both debug exceptions and interrupts. This is likely to be | |
75 | * faster than two daifclr operations, since writes to this register | |
76 | * are self-synchronising. | |
77 | */ | |
78 | .macro enable_dbg_and_irq | |
79 | msr daifclr, #(8 | 2) | |
0be7320a CM |
80 | .endm |
81 | ||
82 | /* | |
83 | * SMP data memory barrier | |
84 | */ | |
85 | .macro smp_dmb, opt | |
0be7320a | 86 | dmb \opt |
0be7320a CM |
87 | .endm |
88 | ||
f99a250c WD |
89 | /* |
90 | * NOP sequence | |
91 | */ | |
92 | .macro nops, num | |
93 | .rept \num | |
94 | nop | |
95 | .endr | |
96 | .endm | |
97 | ||
6c94f27a AB |
98 | /* |
99 | * Emit an entry into the exception table | |
100 | */ | |
101 | .macro _asm_extable, from, to | |
102 | .pushsection __ex_table, "a" | |
103 | .align 3 | |
104 | .long (\from - .), (\to - .) | |
105 | .popsection | |
106 | .endm | |
107 | ||
0be7320a CM |
108 | #define USER(l, x...) \ |
109 | 9999: x; \ | |
6c94f27a | 110 | _asm_extable 9999b, l |
0be7320a CM |
111 | |
112 | /* | |
113 | * Register aliases. | |
114 | */ | |
115 | lr .req x30 // link register | |
dc637f1f MZ |
116 | |
117 | /* | |
118 | * Vector entry | |
119 | */ | |
120 | .macro ventry label | |
121 | .align 7 | |
122 | b \label | |
123 | .endm | |
e68bedaa ML |
124 | |
125 | /* | |
126 | * Select code when configured for BE. | |
127 | */ | |
128 | #ifdef CONFIG_CPU_BIG_ENDIAN | |
129 | #define CPU_BE(code...) code | |
130 | #else | |
131 | #define CPU_BE(code...) | |
132 | #endif | |
133 | ||
134 | /* | |
135 | * Select code when configured for LE. | |
136 | */ | |
137 | #ifdef CONFIG_CPU_BIG_ENDIAN | |
138 | #define CPU_LE(code...) | |
139 | #else | |
140 | #define CPU_LE(code...) code | |
141 | #endif | |
142 | ||
55b89540 ML |
143 | /* |
144 | * Define a macro that constructs a 64-bit value by concatenating two | |
145 | * 32-bit registers. Note that on big endian systems the order of the | |
146 | * registers is swapped. | |
147 | */ | |
148 | #ifndef CONFIG_CPU_BIG_ENDIAN | |
149 | .macro regs_to_64, rd, lbits, hbits | |
150 | #else | |
151 | .macro regs_to_64, rd, hbits, lbits | |
152 | #endif | |
153 | orr \rd, \lbits, \hbits, lsl #32 | |
154 | .endm | |
f3e39273 | 155 | |
b784a5d9 AB |
156 | /* |
157 | * Pseudo-ops for PC-relative adr/ldr/str <reg>, <symbol> where | |
158 | * <symbol> is within the range +/- 4 GB of the PC. | |
159 | */ | |
160 | /* | |
161 | * @dst: destination register (64 bit wide) | |
162 | * @sym: name of the symbol | |
163 | * @tmp: optional scratch register to be used if <dst> == sp, which | |
164 | * is not allowed in an adrp instruction | |
165 | */ | |
166 | .macro adr_l, dst, sym, tmp= | |
167 | .ifb \tmp | |
168 | adrp \dst, \sym | |
169 | add \dst, \dst, :lo12:\sym | |
170 | .else | |
171 | adrp \tmp, \sym | |
172 | add \dst, \tmp, :lo12:\sym | |
173 | .endif | |
174 | .endm | |
175 | ||
176 | /* | |
177 | * @dst: destination register (32 or 64 bit wide) | |
178 | * @sym: name of the symbol | |
179 | * @tmp: optional 64-bit scratch register to be used if <dst> is a | |
180 | * 32-bit wide register, in which case it cannot be used to hold | |
181 | * the address | |
182 | */ | |
183 | .macro ldr_l, dst, sym, tmp= | |
184 | .ifb \tmp | |
185 | adrp \dst, \sym | |
186 | ldr \dst, [\dst, :lo12:\sym] | |
187 | .else | |
188 | adrp \tmp, \sym | |
189 | ldr \dst, [\tmp, :lo12:\sym] | |
190 | .endif | |
191 | .endm | |
192 | ||
193 | /* | |
194 | * @src: source register (32 or 64 bit wide) | |
195 | * @sym: name of the symbol | |
196 | * @tmp: mandatory 64-bit scratch register to calculate the address | |
197 | * while <src> needs to be preserved. | |
198 | */ | |
199 | .macro str_l, src, sym, tmp | |
200 | adrp \tmp, \sym | |
201 | str \src, [\tmp, :lo12:\sym] | |
202 | .endm | |
203 | ||
aa4d5d3c JM |
204 | /* |
205 | * @sym: The name of the per-cpu variable | |
206 | * @reg: Result of per_cpu(sym, smp_processor_id()) | |
207 | * @tmp: scratch register | |
208 | */ | |
209 | .macro this_cpu_ptr, sym, reg, tmp | |
210 | adr_l \reg, \sym | |
211 | mrs \tmp, tpidr_el1 | |
212 | add \reg, \reg, \tmp | |
213 | .endm | |
214 | ||
7b7293ae GL |
215 | /* |
216 | * vma_vm_mm - get mm pointer from vma pointer (vma->vm_mm) | |
217 | */ | |
218 | .macro vma_vm_mm, rd, rn | |
219 | ldr \rd, [\rn, #VMA_VM_MM] | |
220 | .endm | |
221 | ||
222 | /* | |
223 | * mmid - get context id from mm pointer (mm->context.id) | |
224 | */ | |
225 | .macro mmid, rd, rn | |
226 | ldr \rd, [\rn, #MM_CONTEXT_ID] | |
227 | .endm | |
116c81f4 SP |
228 | /* |
229 | * read_ctr - read CTR_EL0. If the system has mismatched | |
230 | * cache line sizes, provide the system wide safe value | |
231 | * from arm64_ftr_reg_ctrel0.sys_val | |
232 | */ | |
233 | .macro read_ctr, reg | |
234 | alternative_if_not ARM64_MISMATCHED_CACHE_LINE_SIZE | |
235 | mrs \reg, ctr_el0 // read CTR | |
236 | nop | |
237 | alternative_else | |
238 | ldr_l \reg, arm64_ftr_reg_ctrel0 + ARM64_FTR_SYSVAL | |
239 | alternative_endif | |
240 | .endm | |
241 | ||
7b7293ae GL |
242 | |
243 | /* | |
072f0a63 SP |
244 | * raw_dcache_line_size - get the minimum D-cache line size on this CPU |
245 | * from the CTR register. | |
7b7293ae | 246 | */ |
072f0a63 | 247 | .macro raw_dcache_line_size, reg, tmp |
7b7293ae GL |
248 | mrs \tmp, ctr_el0 // read CTR |
249 | ubfm \tmp, \tmp, #16, #19 // cache line size encoding | |
250 | mov \reg, #4 // bytes per word | |
251 | lsl \reg, \reg, \tmp // actual cache line size | |
252 | .endm | |
253 | ||
254 | /* | |
072f0a63 | 255 | * dcache_line_size - get the safe D-cache line size across all CPUs |
7b7293ae | 256 | */ |
072f0a63 | 257 | .macro dcache_line_size, reg, tmp |
116c81f4 SP |
258 | read_ctr \tmp |
259 | ubfm \tmp, \tmp, #16, #19 // cache line size encoding | |
260 | mov \reg, #4 // bytes per word | |
261 | lsl \reg, \reg, \tmp // actual cache line size | |
072f0a63 SP |
262 | .endm |
263 | ||
264 | /* | |
265 | * raw_icache_line_size - get the minimum I-cache line size on this CPU | |
266 | * from the CTR register. | |
267 | */ | |
268 | .macro raw_icache_line_size, reg, tmp | |
7b7293ae GL |
269 | mrs \tmp, ctr_el0 // read CTR |
270 | and \tmp, \tmp, #0xf // cache line size encoding | |
271 | mov \reg, #4 // bytes per word | |
272 | lsl \reg, \reg, \tmp // actual cache line size | |
273 | .endm | |
274 | ||
072f0a63 SP |
275 | /* |
276 | * icache_line_size - get the safe I-cache line size across all CPUs | |
277 | */ | |
278 | .macro icache_line_size, reg, tmp | |
116c81f4 SP |
279 | read_ctr \tmp |
280 | and \tmp, \tmp, #0xf // cache line size encoding | |
281 | mov \reg, #4 // bytes per word | |
282 | lsl \reg, \reg, \tmp // actual cache line size | |
072f0a63 SP |
283 | .endm |
284 | ||
7b7293ae GL |
285 | /* |
286 | * tcr_set_idmap_t0sz - update TCR.T0SZ so that we can load the ID map | |
287 | */ | |
288 | .macro tcr_set_idmap_t0sz, valreg, tmpreg | |
289 | #ifndef CONFIG_ARM64_VA_BITS_48 | |
290 | ldr_l \tmpreg, idmap_t0sz | |
291 | bfi \valreg, \tmpreg, #TCR_T0SZ_OFFSET, #TCR_TxSZ_WIDTH | |
292 | #endif | |
293 | .endm | |
294 | ||
295 | /* | |
296 | * Macro to perform a data cache maintenance for the interval | |
297 | * [kaddr, kaddr + size) | |
298 | * | |
299 | * op: operation passed to dc instruction | |
300 | * domain: domain used in dsb instruciton | |
301 | * kaddr: starting virtual address of the region | |
302 | * size: size of the region | |
303 | * Corrupts: kaddr, size, tmp1, tmp2 | |
304 | */ | |
305 | .macro dcache_by_line_op op, domain, kaddr, size, tmp1, tmp2 | |
306 | dcache_line_size \tmp1, \tmp2 | |
307 | add \size, \kaddr, \size | |
308 | sub \tmp2, \tmp1, #1 | |
309 | bic \kaddr, \kaddr, \tmp2 | |
823066d9 AP |
310 | 9998: |
311 | .if (\op == cvau || \op == cvac) | |
312 | alternative_if_not ARM64_WORKAROUND_CLEAN_CACHE | |
313 | dc \op, \kaddr | |
314 | alternative_else | |
315 | dc civac, \kaddr | |
316 | alternative_endif | |
317 | .else | |
318 | dc \op, \kaddr | |
319 | .endif | |
7b7293ae GL |
320 | add \kaddr, \kaddr, \tmp1 |
321 | cmp \kaddr, \size | |
322 | b.lo 9998b | |
323 | dsb \domain | |
324 | .endm | |
325 | ||
326 | /* | |
327 | * reset_pmuserenr_el0 - reset PMUSERENR_EL0 if PMUv3 present | |
328 | */ | |
329 | .macro reset_pmuserenr_el0, tmpreg | |
330 | mrs \tmpreg, id_aa64dfr0_el1 // Check ID_AA64DFR0_EL1 PMUVer | |
331 | sbfx \tmpreg, \tmpreg, #8, #4 | |
332 | cmp \tmpreg, #1 // Skip if no PMU present | |
333 | b.lt 9000f | |
334 | msr pmuserenr_el0, xzr // Disable PMU access from EL0 | |
335 | 9000: | |
336 | .endm | |
337 | ||
5003dbde GL |
338 | /* |
339 | * copy_page - copy src to dest using temp registers t1-t8 | |
340 | */ | |
341 | .macro copy_page dest:req src:req t1:req t2:req t3:req t4:req t5:req t6:req t7:req t8:req | |
342 | 9998: ldp \t1, \t2, [\src] | |
343 | ldp \t3, \t4, [\src, #16] | |
344 | ldp \t5, \t6, [\src, #32] | |
345 | ldp \t7, \t8, [\src, #48] | |
346 | add \src, \src, #64 | |
347 | stnp \t1, \t2, [\dest] | |
348 | stnp \t3, \t4, [\dest, #16] | |
349 | stnp \t5, \t6, [\dest, #32] | |
350 | stnp \t7, \t8, [\dest, #48] | |
351 | add \dest, \dest, #64 | |
352 | tst \src, #(PAGE_SIZE - 1) | |
353 | b.ne 9998b | |
354 | .endm | |
355 | ||
20791846 AB |
356 | /* |
357 | * Annotate a function as position independent, i.e., safe to be called before | |
358 | * the kernel virtual mapping is activated. | |
359 | */ | |
360 | #define ENDPIPROC(x) \ | |
361 | .globl __pi_##x; \ | |
362 | .type __pi_##x, %function; \ | |
363 | .set __pi_##x, x; \ | |
364 | .size __pi_##x, . - x; \ | |
365 | ENDPROC(x) | |
366 | ||
6ad1fe5d AB |
367 | /* |
368 | * Emit a 64-bit absolute little endian symbol reference in a way that | |
369 | * ensures that it will be resolved at build time, even when building a | |
370 | * PIE binary. This requires cooperation from the linker script, which | |
371 | * must emit the lo32/hi32 halves individually. | |
372 | */ | |
373 | .macro le64sym, sym | |
374 | .long \sym\()_lo32 | |
375 | .long \sym\()_hi32 | |
376 | .endm | |
377 | ||
30b5ba5c AB |
378 | /* |
379 | * mov_q - move an immediate constant into a 64-bit register using | |
380 | * between 2 and 4 movz/movk instructions (depending on the | |
381 | * magnitude and sign of the operand) | |
382 | */ | |
383 | .macro mov_q, reg, val | |
384 | .if (((\val) >> 31) == 0 || ((\val) >> 31) == 0x1ffffffff) | |
385 | movz \reg, :abs_g1_s:\val | |
386 | .else | |
387 | .if (((\val) >> 47) == 0 || ((\val) >> 47) == 0x1ffff) | |
388 | movz \reg, :abs_g2_s:\val | |
389 | .else | |
390 | movz \reg, :abs_g3:\val | |
391 | movk \reg, :abs_g2_nc:\val | |
392 | .endif | |
393 | movk \reg, :abs_g1_nc:\val | |
394 | .endif | |
395 | movk \reg, :abs_g0_nc:\val | |
396 | .endm | |
397 | ||
f3e39273 | 398 | #endif /* __ASM_ASSEMBLER_H */ |