15b0b14e5SHuacai Chen /* SPDX-License-Identifier: GPL-2.0 */
25b0b14e5SHuacai Chen /*
35b0b14e5SHuacai Chen * Copyright (C) 2020-2022 Loongson Technology Corporation Limited
45b0b14e5SHuacai Chen */
55b0b14e5SHuacai Chen #ifndef __ASM_PERCPU_H
65b0b14e5SHuacai Chen #define __ASM_PERCPU_H
75b0b14e5SHuacai Chen
846859ac8SHuacai Chen #include <asm/cmpxchg.h>
9255b4658SHuacai Chen #include <asm/loongarch.h>
1046859ac8SHuacai Chen
1111cd8a64SXi Ruoyao /*
1211cd8a64SXi Ruoyao * The "address" (in fact, offset from $r21) of a per-CPU variable is close to
1311cd8a64SXi Ruoyao * the loading address of main kernel image, but far from where the modules are
1411cd8a64SXi Ruoyao * loaded. Tell the compiler this fact when using explicit relocs.
1511cd8a64SXi Ruoyao */
1611cd8a64SXi Ruoyao #if defined(MODULE) && defined(CONFIG_AS_HAS_EXPLICIT_RELOCS)
1738b10b26SWANG Xuerui # if __has_attribute(model)
1811cd8a64SXi Ruoyao # define PER_CPU_ATTRIBUTES __attribute__((model("extreme")))
1938b10b26SWANG Xuerui # else
2038b10b26SWANG Xuerui # error compiler support for the model attribute is necessary when a recent assembler is used
2138b10b26SWANG Xuerui # endif
2211cd8a64SXi Ruoyao #endif
2311cd8a64SXi Ruoyao
245b0b14e5SHuacai Chen /* Use r21 for fast access */
255b0b14e5SHuacai Chen register unsigned long __my_cpu_offset __asm__("$r21");
265b0b14e5SHuacai Chen
set_my_cpu_offset(unsigned long off)275b0b14e5SHuacai Chen static inline void set_my_cpu_offset(unsigned long off)
285b0b14e5SHuacai Chen {
295b0b14e5SHuacai Chen __my_cpu_offset = off;
305b0b14e5SHuacai Chen csr_write64(off, PERCPU_BASE_KS);
315b0b14e5SHuacai Chen }
32c87e12e0SHuacai Chen
33c87e12e0SHuacai Chen #define __my_cpu_offset \
34c87e12e0SHuacai Chen ({ \
35c87e12e0SHuacai Chen __asm__ __volatile__("":"+r"(__my_cpu_offset)); \
36c87e12e0SHuacai Chen __my_cpu_offset; \
37c87e12e0SHuacai Chen })
385b0b14e5SHuacai Chen
3946859ac8SHuacai Chen #define PERCPU_OP(op, asm_op, c_op) \
4071945968SNathan Chancellor static __always_inline unsigned long __percpu_##op(void *ptr, \
4146859ac8SHuacai Chen unsigned long val, int size) \
4246859ac8SHuacai Chen { \
4346859ac8SHuacai Chen unsigned long ret; \
4446859ac8SHuacai Chen \
4546859ac8SHuacai Chen switch (size) { \
4646859ac8SHuacai Chen case 4: \
4746859ac8SHuacai Chen __asm__ __volatile__( \
4846859ac8SHuacai Chen "am"#asm_op".w" " %[ret], %[val], %[ptr] \n" \
4946859ac8SHuacai Chen : [ret] "=&r" (ret), [ptr] "+ZB"(*(u32 *)ptr) \
5046859ac8SHuacai Chen : [val] "r" (val)); \
5146859ac8SHuacai Chen break; \
5246859ac8SHuacai Chen case 8: \
5346859ac8SHuacai Chen __asm__ __volatile__( \
5446859ac8SHuacai Chen "am"#asm_op".d" " %[ret], %[val], %[ptr] \n" \
5546859ac8SHuacai Chen : [ret] "=&r" (ret), [ptr] "+ZB"(*(u64 *)ptr) \
5646859ac8SHuacai Chen : [val] "r" (val)); \
5746859ac8SHuacai Chen break; \
5846859ac8SHuacai Chen default: \
5946859ac8SHuacai Chen ret = 0; \
6046859ac8SHuacai Chen BUILD_BUG(); \
6146859ac8SHuacai Chen } \
6246859ac8SHuacai Chen \
6346859ac8SHuacai Chen return ret c_op val; \
6446859ac8SHuacai Chen }
6546859ac8SHuacai Chen
6646859ac8SHuacai Chen PERCPU_OP(add, add, +)
6746859ac8SHuacai Chen PERCPU_OP(and, and, &)
6846859ac8SHuacai Chen PERCPU_OP(or, or, |)
6946859ac8SHuacai Chen #undef PERCPU_OP
7046859ac8SHuacai Chen
__percpu_xchg(void * ptr,unsigned long val,int size)71ee2daf71SHuacai Chen static __always_inline unsigned long __percpu_xchg(void *ptr, unsigned long val, int size)
7246859ac8SHuacai Chen {
7346859ac8SHuacai Chen switch (size) {
74720dc7abSHuacai Chen case 1:
75720dc7abSHuacai Chen case 2:
76720dc7abSHuacai Chen return __xchg_small((volatile void *)ptr, val, size);
77720dc7abSHuacai Chen
7846859ac8SHuacai Chen case 4:
7946859ac8SHuacai Chen return __xchg_asm("amswap.w", (volatile u32 *)ptr, (u32)val);
8046859ac8SHuacai Chen
8146859ac8SHuacai Chen case 8:
8246859ac8SHuacai Chen return __xchg_asm("amswap.d", (volatile u64 *)ptr, (u64)val);
8346859ac8SHuacai Chen
8446859ac8SHuacai Chen default:
8546859ac8SHuacai Chen BUILD_BUG();
8646859ac8SHuacai Chen }
8746859ac8SHuacai Chen
8846859ac8SHuacai Chen return 0;
8946859ac8SHuacai Chen }
9046859ac8SHuacai Chen
91*d4f31acfSUros Bizjak #define __pcpu_op_1(op) op ".b "
92*d4f31acfSUros Bizjak #define __pcpu_op_2(op) op ".h "
93*d4f31acfSUros Bizjak #define __pcpu_op_4(op) op ".w "
94*d4f31acfSUros Bizjak #define __pcpu_op_8(op) op ".d "
95*d4f31acfSUros Bizjak
96*d4f31acfSUros Bizjak #define _percpu_read(size, _pcp) \
97*d4f31acfSUros Bizjak ({ \
98*d4f31acfSUros Bizjak typeof(_pcp) __pcp_ret; \
99*d4f31acfSUros Bizjak \
100*d4f31acfSUros Bizjak __asm__ __volatile__( \
101*d4f31acfSUros Bizjak __pcpu_op_##size("ldx") "%[ret], $r21, %[ptr] \n" \
102*d4f31acfSUros Bizjak : [ret] "=&r"(__pcp_ret) \
103*d4f31acfSUros Bizjak : [ptr] "r"(&(_pcp)) \
104*d4f31acfSUros Bizjak : "memory"); \
105*d4f31acfSUros Bizjak \
106*d4f31acfSUros Bizjak __pcp_ret; \
107*d4f31acfSUros Bizjak })
108*d4f31acfSUros Bizjak
109*d4f31acfSUros Bizjak #define _percpu_write(size, _pcp, _val) \
110*d4f31acfSUros Bizjak do { \
111*d4f31acfSUros Bizjak __asm__ __volatile__( \
112*d4f31acfSUros Bizjak __pcpu_op_##size("stx") "%[val], $r21, %[ptr] \n" \
113*d4f31acfSUros Bizjak : \
114*d4f31acfSUros Bizjak : [val] "r"(_val), [ptr] "r"(&(_pcp)) \
115*d4f31acfSUros Bizjak : "memory"); \
116*d4f31acfSUros Bizjak } while (0)
117*d4f31acfSUros Bizjak
11846859ac8SHuacai Chen /* this_cpu_cmpxchg */
11946859ac8SHuacai Chen #define _protect_cmpxchg_local(pcp, o, n) \
12046859ac8SHuacai Chen ({ \
12146859ac8SHuacai Chen typeof(*raw_cpu_ptr(&(pcp))) __ret; \
12246859ac8SHuacai Chen preempt_disable_notrace(); \
12346859ac8SHuacai Chen __ret = cmpxchg_local(raw_cpu_ptr(&(pcp)), o, n); \
12446859ac8SHuacai Chen preempt_enable_notrace(); \
12546859ac8SHuacai Chen __ret; \
12646859ac8SHuacai Chen })
12746859ac8SHuacai Chen
12846859ac8SHuacai Chen #define _pcp_protect(operation, pcp, val) \
12946859ac8SHuacai Chen ({ \
13046859ac8SHuacai Chen typeof(pcp) __retval; \
13146859ac8SHuacai Chen preempt_disable_notrace(); \
13246859ac8SHuacai Chen __retval = (typeof(pcp))operation(raw_cpu_ptr(&(pcp)), \
13346859ac8SHuacai Chen (val), sizeof(pcp)); \
13446859ac8SHuacai Chen preempt_enable_notrace(); \
13546859ac8SHuacai Chen __retval; \
13646859ac8SHuacai Chen })
13746859ac8SHuacai Chen
13846859ac8SHuacai Chen #define _percpu_add(pcp, val) \
13946859ac8SHuacai Chen _pcp_protect(__percpu_add, pcp, val)
14046859ac8SHuacai Chen
14146859ac8SHuacai Chen #define _percpu_add_return(pcp, val) _percpu_add(pcp, val)
14246859ac8SHuacai Chen
14346859ac8SHuacai Chen #define _percpu_and(pcp, val) \
14446859ac8SHuacai Chen _pcp_protect(__percpu_and, pcp, val)
14546859ac8SHuacai Chen
14646859ac8SHuacai Chen #define _percpu_or(pcp, val) \
14746859ac8SHuacai Chen _pcp_protect(__percpu_or, pcp, val)
14846859ac8SHuacai Chen
14946859ac8SHuacai Chen #define _percpu_xchg(pcp, val) ((typeof(pcp)) \
15046859ac8SHuacai Chen _pcp_protect(__percpu_xchg, pcp, (unsigned long)(val)))
15146859ac8SHuacai Chen
15246859ac8SHuacai Chen #define this_cpu_add_4(pcp, val) _percpu_add(pcp, val)
15346859ac8SHuacai Chen #define this_cpu_add_8(pcp, val) _percpu_add(pcp, val)
15446859ac8SHuacai Chen
15546859ac8SHuacai Chen #define this_cpu_add_return_4(pcp, val) _percpu_add_return(pcp, val)
15646859ac8SHuacai Chen #define this_cpu_add_return_8(pcp, val) _percpu_add_return(pcp, val)
15746859ac8SHuacai Chen
15846859ac8SHuacai Chen #define this_cpu_and_4(pcp, val) _percpu_and(pcp, val)
15946859ac8SHuacai Chen #define this_cpu_and_8(pcp, val) _percpu_and(pcp, val)
16046859ac8SHuacai Chen
16146859ac8SHuacai Chen #define this_cpu_or_4(pcp, val) _percpu_or(pcp, val)
16246859ac8SHuacai Chen #define this_cpu_or_8(pcp, val) _percpu_or(pcp, val)
16346859ac8SHuacai Chen
164*d4f31acfSUros Bizjak #define this_cpu_read_1(pcp) _percpu_read(1, pcp)
165*d4f31acfSUros Bizjak #define this_cpu_read_2(pcp) _percpu_read(2, pcp)
166*d4f31acfSUros Bizjak #define this_cpu_read_4(pcp) _percpu_read(4, pcp)
167*d4f31acfSUros Bizjak #define this_cpu_read_8(pcp) _percpu_read(8, pcp)
16846859ac8SHuacai Chen
169*d4f31acfSUros Bizjak #define this_cpu_write_1(pcp, val) _percpu_write(1, pcp, val)
170*d4f31acfSUros Bizjak #define this_cpu_write_2(pcp, val) _percpu_write(2, pcp, val)
171*d4f31acfSUros Bizjak #define this_cpu_write_4(pcp, val) _percpu_write(4, pcp, val)
172*d4f31acfSUros Bizjak #define this_cpu_write_8(pcp, val) _percpu_write(8, pcp, val)
17346859ac8SHuacai Chen
174720dc7abSHuacai Chen #define this_cpu_xchg_1(pcp, val) _percpu_xchg(pcp, val)
175720dc7abSHuacai Chen #define this_cpu_xchg_2(pcp, val) _percpu_xchg(pcp, val)
17646859ac8SHuacai Chen #define this_cpu_xchg_4(pcp, val) _percpu_xchg(pcp, val)
17746859ac8SHuacai Chen #define this_cpu_xchg_8(pcp, val) _percpu_xchg(pcp, val)
17846859ac8SHuacai Chen
179720dc7abSHuacai Chen #define this_cpu_cmpxchg_1(ptr, o, n) _protect_cmpxchg_local(ptr, o, n)
180720dc7abSHuacai Chen #define this_cpu_cmpxchg_2(ptr, o, n) _protect_cmpxchg_local(ptr, o, n)
18146859ac8SHuacai Chen #define this_cpu_cmpxchg_4(ptr, o, n) _protect_cmpxchg_local(ptr, o, n)
18246859ac8SHuacai Chen #define this_cpu_cmpxchg_8(ptr, o, n) _protect_cmpxchg_local(ptr, o, n)
18346859ac8SHuacai Chen
1845b0b14e5SHuacai Chen #include <asm-generic/percpu.h>
1855b0b14e5SHuacai Chen
1865b0b14e5SHuacai Chen #endif /* __ASM_PERCPU_H */
187