xref: /openbmc/linux/arch/loongarch/include/asm/percpu.h (revision 46eeaa11bdd1bc9e077bdf741d32ca7235d263c6)
/* SPDX-License-Identifier: GPL-2.0 */
/*
 * Copyright (C) 2020-2022 Loongson Technology Corporation Limited
 */
55b0b14e5SHuacai Chen #ifndef __ASM_PERCPU_H
65b0b14e5SHuacai Chen #define __ASM_PERCPU_H
75b0b14e5SHuacai Chen 
846859ac8SHuacai Chen #include <asm/cmpxchg.h>
9255b4658SHuacai Chen #include <asm/loongarch.h>
1046859ac8SHuacai Chen 
/*
 * The "address" (in fact, offset from $r21) of a per-CPU variable is close to
 * the loading address of main kernel image, but far from where the modules are
 * loaded. Tell the compiler this fact when using explicit relocs.
 *
 * PER_CPU_ATTRIBUTES is only defined here for module builds (MODULE) with an
 * assembler that supports explicit relocs (CONFIG_AS_HAS_EXPLICIT_RELOCS).
 * In that configuration a compiler without the "model" attribute is rejected
 * at build time instead of silently producing unusable relocations.
 */
#if defined(MODULE) && defined(CONFIG_AS_HAS_EXPLICIT_RELOCS)
# if __has_attribute(model)
#  define PER_CPU_ATTRIBUTES __attribute__((model("extreme")))
# else
#  error compiler support for the model attribute is necessary when a recent assembler is used
# endif
#endif
2311cd8a64SXi Ruoyao 
245b0b14e5SHuacai Chen /* Use r21 for fast access */
255b0b14e5SHuacai Chen register unsigned long __my_cpu_offset __asm__("$r21");
265b0b14e5SHuacai Chen 
set_my_cpu_offset(unsigned long off)275b0b14e5SHuacai Chen static inline void set_my_cpu_offset(unsigned long off)
285b0b14e5SHuacai Chen {
295b0b14e5SHuacai Chen 	__my_cpu_offset = off;
305b0b14e5SHuacai Chen 	csr_write64(off, PERCPU_BASE_KS);
315b0b14e5SHuacai Chen }
32*f3f5d7a5SHuacai Chen 
/*
 * Reader for the per-CPU offset.
 *
 * From this point on every use of __my_cpu_offset expands to a statement
 * expression. Inside the expansion the identifier is not expanded again, so
 * it names the $r21 register variable itself. The empty asm emits no
 * instruction but lists the variable as a read-write ("+r") operand before
 * its value is produced.
 *
 * NOTE(review): the asm presumably stops the compiler from reusing an
 * earlier copy of $r21; confirm against the originating commit.
 *
 * This definition must stay after set_my_cpu_offset(), which assigns to the
 * register variable by name and would not compile once the macro is active.
 */
#define __my_cpu_offset					\
({							\
	__asm__ __volatile__("":"+r"(__my_cpu_offset));	\
	__my_cpu_offset;				\
})
385b0b14e5SHuacai Chen 
3946859ac8SHuacai Chen #define PERCPU_OP(op, asm_op, c_op)					\
40cff8bf67SNathan Chancellor static __always_inline unsigned long __percpu_##op(void *ptr,		\
4146859ac8SHuacai Chen 			unsigned long val, int size)			\
4246859ac8SHuacai Chen {									\
4346859ac8SHuacai Chen 	unsigned long ret;						\
4446859ac8SHuacai Chen 									\
4546859ac8SHuacai Chen 	switch (size) {							\
4646859ac8SHuacai Chen 	case 4:								\
4746859ac8SHuacai Chen 		__asm__ __volatile__(					\
4846859ac8SHuacai Chen 		"am"#asm_op".w"	" %[ret], %[val], %[ptr]	\n"		\
4946859ac8SHuacai Chen 		: [ret] "=&r" (ret), [ptr] "+ZB"(*(u32 *)ptr)		\
5046859ac8SHuacai Chen 		: [val] "r" (val));					\
5146859ac8SHuacai Chen 		break;							\
5246859ac8SHuacai Chen 	case 8:								\
5346859ac8SHuacai Chen 		__asm__ __volatile__(					\
5446859ac8SHuacai Chen 		"am"#asm_op".d" " %[ret], %[val], %[ptr]	\n"		\
5546859ac8SHuacai Chen 		: [ret] "=&r" (ret), [ptr] "+ZB"(*(u64 *)ptr)		\
5646859ac8SHuacai Chen 		: [val] "r" (val));					\
5746859ac8SHuacai Chen 		break;							\
5846859ac8SHuacai Chen 	default:							\
5946859ac8SHuacai Chen 		ret = 0;						\
6046859ac8SHuacai Chen 		BUILD_BUG();						\
6146859ac8SHuacai Chen 	}								\
6246859ac8SHuacai Chen 									\
6346859ac8SHuacai Chen 	return ret c_op val;						\
6446859ac8SHuacai Chen }
6546859ac8SHuacai Chen 
6646859ac8SHuacai Chen PERCPU_OP(add, add, +)
6746859ac8SHuacai Chen PERCPU_OP(and, and, &)
6846859ac8SHuacai Chen PERCPU_OP(or, or, |)
6946859ac8SHuacai Chen #undef PERCPU_OP
7046859ac8SHuacai Chen 
__percpu_read(void * ptr,int size)71cff8bf67SNathan Chancellor static __always_inline unsigned long __percpu_read(void *ptr, int size)
7246859ac8SHuacai Chen {
7346859ac8SHuacai Chen 	unsigned long ret;
7446859ac8SHuacai Chen 
7546859ac8SHuacai Chen 	switch (size) {
7646859ac8SHuacai Chen 	case 1:
7746859ac8SHuacai Chen 		__asm__ __volatile__ ("ldx.b %[ret], $r21, %[ptr]	\n"
7846859ac8SHuacai Chen 		: [ret] "=&r"(ret)
7946859ac8SHuacai Chen 		: [ptr] "r"(ptr)
8046859ac8SHuacai Chen 		: "memory");
8146859ac8SHuacai Chen 		break;
8246859ac8SHuacai Chen 	case 2:
8346859ac8SHuacai Chen 		__asm__ __volatile__ ("ldx.h %[ret], $r21, %[ptr]	\n"
8446859ac8SHuacai Chen 		: [ret] "=&r"(ret)
8546859ac8SHuacai Chen 		: [ptr] "r"(ptr)
8646859ac8SHuacai Chen 		: "memory");
8746859ac8SHuacai Chen 		break;
8846859ac8SHuacai Chen 	case 4:
8946859ac8SHuacai Chen 		__asm__ __volatile__ ("ldx.w %[ret], $r21, %[ptr]	\n"
9046859ac8SHuacai Chen 		: [ret] "=&r"(ret)
9146859ac8SHuacai Chen 		: [ptr] "r"(ptr)
9246859ac8SHuacai Chen 		: "memory");
9346859ac8SHuacai Chen 		break;
9446859ac8SHuacai Chen 	case 8:
9546859ac8SHuacai Chen 		__asm__ __volatile__ ("ldx.d %[ret], $r21, %[ptr]	\n"
9646859ac8SHuacai Chen 		: [ret] "=&r"(ret)
9746859ac8SHuacai Chen 		: [ptr] "r"(ptr)
9846859ac8SHuacai Chen 		: "memory");
9946859ac8SHuacai Chen 		break;
10046859ac8SHuacai Chen 	default:
10146859ac8SHuacai Chen 		ret = 0;
10246859ac8SHuacai Chen 		BUILD_BUG();
10346859ac8SHuacai Chen 	}
10446859ac8SHuacai Chen 
10546859ac8SHuacai Chen 	return ret;
10646859ac8SHuacai Chen }
10746859ac8SHuacai Chen 
__percpu_write(void * ptr,unsigned long val,int size)108cff8bf67SNathan Chancellor static __always_inline void __percpu_write(void *ptr, unsigned long val, int size)
10946859ac8SHuacai Chen {
11046859ac8SHuacai Chen 	switch (size) {
11146859ac8SHuacai Chen 	case 1:
11246859ac8SHuacai Chen 		__asm__ __volatile__("stx.b %[val], $r21, %[ptr]	\n"
11346859ac8SHuacai Chen 		:
11446859ac8SHuacai Chen 		: [val] "r" (val), [ptr] "r" (ptr)
11546859ac8SHuacai Chen 		: "memory");
11646859ac8SHuacai Chen 		break;
11746859ac8SHuacai Chen 	case 2:
11846859ac8SHuacai Chen 		__asm__ __volatile__("stx.h %[val], $r21, %[ptr]	\n"
11946859ac8SHuacai Chen 		:
12046859ac8SHuacai Chen 		: [val] "r" (val), [ptr] "r" (ptr)
12146859ac8SHuacai Chen 		: "memory");
12246859ac8SHuacai Chen 		break;
12346859ac8SHuacai Chen 	case 4:
12446859ac8SHuacai Chen 		__asm__ __volatile__("stx.w %[val], $r21, %[ptr]	\n"
12546859ac8SHuacai Chen 		:
12646859ac8SHuacai Chen 		: [val] "r" (val), [ptr] "r" (ptr)
12746859ac8SHuacai Chen 		: "memory");
12846859ac8SHuacai Chen 		break;
12946859ac8SHuacai Chen 	case 8:
13046859ac8SHuacai Chen 		__asm__ __volatile__("stx.d %[val], $r21, %[ptr]	\n"
13146859ac8SHuacai Chen 		:
13246859ac8SHuacai Chen 		: [val] "r" (val), [ptr] "r" (ptr)
13346859ac8SHuacai Chen 		: "memory");
13446859ac8SHuacai Chen 		break;
13546859ac8SHuacai Chen 	default:
13646859ac8SHuacai Chen 		BUILD_BUG();
13746859ac8SHuacai Chen 	}
13846859ac8SHuacai Chen }
13946859ac8SHuacai Chen 
__percpu_xchg(void * ptr,unsigned long val,int size)140cff8bf67SNathan Chancellor static __always_inline unsigned long __percpu_xchg(void *ptr, unsigned long val,
14146859ac8SHuacai Chen 						   int size)
14246859ac8SHuacai Chen {
14346859ac8SHuacai Chen 	switch (size) {
144720dc7abSHuacai Chen 	case 1:
145720dc7abSHuacai Chen 	case 2:
146720dc7abSHuacai Chen 		return __xchg_small((volatile void *)ptr, val, size);
147720dc7abSHuacai Chen 
14846859ac8SHuacai Chen 	case 4:
14946859ac8SHuacai Chen 		return __xchg_asm("amswap.w", (volatile u32 *)ptr, (u32)val);
15046859ac8SHuacai Chen 
15146859ac8SHuacai Chen 	case 8:
15246859ac8SHuacai Chen 		return __xchg_asm("amswap.d", (volatile u64 *)ptr, (u64)val);
15346859ac8SHuacai Chen 
15446859ac8SHuacai Chen 	default:
15546859ac8SHuacai Chen 		BUILD_BUG();
15646859ac8SHuacai Chen 	}
15746859ac8SHuacai Chen 
15846859ac8SHuacai Chen 	return 0;
15946859ac8SHuacai Chen }
16046859ac8SHuacai Chen 
/*
 * this_cpu_cmpxchg backend.
 *
 * @pcp is the per-CPU variable itself (an lvalue, not a pointer). With
 * preemption disabled (notrace variants), run cmpxchg_local() on this CPU's
 * instance, comparing against @o and storing @n, and evaluate to the value
 * cmpxchg_local() returned.
 */
#define _protect_cmpxchg_local(pcp, o, n)			\
({								\
	typeof(*raw_cpu_ptr(&(pcp))) __ret;			\
	preempt_disable_notrace();				\
	__ret = cmpxchg_local(raw_cpu_ptr(&(pcp)), o, n);	\
	preempt_enable_notrace();				\
	__ret;							\
})
17046859ac8SHuacai Chen 
/*
 * Typed wrapper around __percpu_read().
 *
 * @pcp is the per-CPU variable itself. Its address is passed unchanged
 * (no raw_cpu_ptr(), no preemption toggling) together with sizeof(pcp), and
 * the unsigned long result is cast back to the variable's type.
 */
#define _percpu_read(pcp)						\
({									\
	typeof(pcp) __retval;						\
	__retval = (typeof(pcp))__percpu_read(&(pcp), sizeof(pcp));	\
	__retval;							\
})
17746859ac8SHuacai Chen 
/*
 * Statement wrapper around __percpu_write().
 *
 * @pcp is the per-CPU variable itself; @val is converted to unsigned long
 * and stored with the width given by sizeof(pcp). The macro yields no value.
 * There is deliberately no line continuation after "while (0)", so the
 * definition ends here regardless of what follows it in the file.
 */
#define _percpu_write(pcp, val)						\
do {									\
	__percpu_write(&(pcp), (unsigned long)(val), sizeof(pcp));	\
} while (0)
18246859ac8SHuacai Chen 
/*
 * Run a pointer-based per-CPU helper with preemption disabled.
 *
 * @operation is called as operation(ptr, val, size) with ptr pointing at
 * this CPU's instance of @pcp (raw_cpu_ptr()) and size == sizeof(pcp).
 * Preemption is disabled around the call (notrace variants) so the pointer
 * stays valid for the CPU that computed it. The helper's result is cast to
 * the type of @pcp and becomes the value of the expression.
 */
#define _pcp_protect(operation, pcp, val)			\
({								\
	typeof(pcp) __retval;					\
	preempt_disable_notrace();				\
	__retval = (typeof(pcp))operation(raw_cpu_ptr(&(pcp)),	\
					  (val), sizeof(pcp));	\
	preempt_enable_notrace();				\
	__retval;						\
})
19246859ac8SHuacai Chen 
/*
 * Typed read-modify-write operations on a per-CPU variable @pcp.
 *
 * Each one routes the matching __percpu_<op>() helper through _pcp_protect(),
 * so it runs on this CPU's instance with preemption disabled.
 * add/and/or evaluate to what __percpu_<op>() returns (the updated value),
 * which is why _percpu_add_return() is simply _percpu_add().
 * _percpu_xchg() evaluates to what __percpu_xchg() returns, cast to the
 * type of @pcp.
 */
#define _percpu_add(pcp, val) \
	_pcp_protect(__percpu_add, pcp, val)

#define _percpu_add_return(pcp, val) _percpu_add(pcp, val)

#define _percpu_and(pcp, val) \
	_pcp_protect(__percpu_and, pcp, val)

#define _percpu_or(pcp, val) \
	_pcp_protect(__percpu_or, pcp, val)

#define _percpu_xchg(pcp, val) ((typeof(pcp)) \
	_pcp_protect(__percpu_xchg, pcp, (unsigned long)(val)))
20646859ac8SHuacai Chen 
/*
 * Size-suffixed this_cpu_*() hooks.
 *
 * Defining these before <asm-generic/percpu.h> is included (at the end of
 * this header) makes the per-size operations resolve to the accessors
 * defined above. add/and/or are provided for 4- and 8-byte objects only;
 * read, write, xchg and cmpxchg are provided for 1, 2, 4 and 8 bytes.
 * In every macro @pcp is the per-CPU variable itself, not a pointer to it.
 */
#define this_cpu_add_4(pcp, val) _percpu_add(pcp, val)
#define this_cpu_add_8(pcp, val) _percpu_add(pcp, val)

#define this_cpu_add_return_4(pcp, val) _percpu_add_return(pcp, val)
#define this_cpu_add_return_8(pcp, val) _percpu_add_return(pcp, val)

#define this_cpu_and_4(pcp, val) _percpu_and(pcp, val)
#define this_cpu_and_8(pcp, val) _percpu_and(pcp, val)

#define this_cpu_or_4(pcp, val) _percpu_or(pcp, val)
#define this_cpu_or_8(pcp, val) _percpu_or(pcp, val)

#define this_cpu_read_1(pcp) _percpu_read(pcp)
#define this_cpu_read_2(pcp) _percpu_read(pcp)
#define this_cpu_read_4(pcp) _percpu_read(pcp)
#define this_cpu_read_8(pcp) _percpu_read(pcp)

#define this_cpu_write_1(pcp, val) _percpu_write(pcp, val)
#define this_cpu_write_2(pcp, val) _percpu_write(pcp, val)
#define this_cpu_write_4(pcp, val) _percpu_write(pcp, val)
#define this_cpu_write_8(pcp, val) _percpu_write(pcp, val)

#define this_cpu_xchg_1(pcp, val) _percpu_xchg(pcp, val)
#define this_cpu_xchg_2(pcp, val) _percpu_xchg(pcp, val)
#define this_cpu_xchg_4(pcp, val) _percpu_xchg(pcp, val)
#define this_cpu_xchg_8(pcp, val) _percpu_xchg(pcp, val)

#define this_cpu_cmpxchg_1(pcp, o, n) _protect_cmpxchg_local(pcp, o, n)
#define this_cpu_cmpxchg_2(pcp, o, n) _protect_cmpxchg_local(pcp, o, n)
#define this_cpu_cmpxchg_4(pcp, o, n) _protect_cmpxchg_local(pcp, o, n)
#define this_cpu_cmpxchg_8(pcp, o, n) _protect_cmpxchg_local(pcp, o, n)
23846859ac8SHuacai Chen 
2395b0b14e5SHuacai Chen #include <asm-generic/percpu.h>
2405b0b14e5SHuacai Chen 
2415b0b14e5SHuacai Chen #endif /* __ASM_PERCPU_H */
242