xref: /openbmc/linux/arch/riscv/include/asm/barrier.h (revision 4f2c0a4acffbec01079c28f839422e64ddeff004)
1caab277bSThomas Gleixner /* SPDX-License-Identifier: GPL-2.0-only */
2fab957c1SPalmer Dabbelt /*
3fab957c1SPalmer Dabbelt  * Based on arch/arm/include/asm/barrier.h
4fab957c1SPalmer Dabbelt  *
5fab957c1SPalmer Dabbelt  * Copyright (C) 2012 ARM Ltd.
6fab957c1SPalmer Dabbelt  * Copyright (C) 2013 Regents of the University of California
7fab957c1SPalmer Dabbelt  * Copyright (C) 2017 SiFive
8fab957c1SPalmer Dabbelt  */
9fab957c1SPalmer Dabbelt 
10fab957c1SPalmer Dabbelt #ifndef _ASM_RISCV_BARRIER_H
11fab957c1SPalmer Dabbelt #define _ASM_RISCV_BARRIER_H
12fab957c1SPalmer Dabbelt 
13fab957c1SPalmer Dabbelt #ifndef __ASSEMBLY__
14fab957c1SPalmer Dabbelt 
15fab957c1SPalmer Dabbelt #define nop()		__asm__ __volatile__ ("nop")
16*c295bc34SHeiko Stuebner #define __nops(n)	".rept	" #n "\nnop\n.endr\n"
17*c295bc34SHeiko Stuebner #define nops(n)		__asm__ __volatile__ (__nops(n))
18fab957c1SPalmer Dabbelt 
19fab957c1SPalmer Dabbelt #define RISCV_FENCE(p, s) \
20fab957c1SPalmer Dabbelt 	__asm__ __volatile__ ("fence " #p "," #s : : : "memory")
21fab957c1SPalmer Dabbelt 
22fab957c1SPalmer Dabbelt /* These barriers need to enforce ordering on both devices or memory. */
23fab957c1SPalmer Dabbelt #define mb()		RISCV_FENCE(iorw,iorw)
24fab957c1SPalmer Dabbelt #define rmb()		RISCV_FENCE(ir,ir)
25fab957c1SPalmer Dabbelt #define wmb()		RISCV_FENCE(ow,ow)
26fab957c1SPalmer Dabbelt 
27fab957c1SPalmer Dabbelt /* These barriers do not need to enforce ordering on devices, just memory. */
28ab4af605SAndrea Parri #define __smp_mb()	RISCV_FENCE(rw,rw)
29ab4af605SAndrea Parri #define __smp_rmb()	RISCV_FENCE(r,r)
30ab4af605SAndrea Parri #define __smp_wmb()	RISCV_FENCE(w,w)
31fab957c1SPalmer Dabbelt 
328d235b17SAndrea Parri #define __smp_store_release(p, v)					\
338d235b17SAndrea Parri do {									\
348d235b17SAndrea Parri 	compiletime_assert_atomic_type(*p);				\
358d235b17SAndrea Parri 	RISCV_FENCE(rw,w);						\
368d235b17SAndrea Parri 	WRITE_ONCE(*p, v);						\
378d235b17SAndrea Parri } while (0)
388d235b17SAndrea Parri 
398d235b17SAndrea Parri #define __smp_load_acquire(p)						\
408d235b17SAndrea Parri ({									\
418d235b17SAndrea Parri 	typeof(*p) ___p1 = READ_ONCE(*p);				\
428d235b17SAndrea Parri 	compiletime_assert_atomic_type(*p);				\
438d235b17SAndrea Parri 	RISCV_FENCE(r,rw);						\
448d235b17SAndrea Parri 	___p1;								\
458d235b17SAndrea Parri })
468d235b17SAndrea Parri 
473cfa5008SPalmer Dabbelt /*
483cfa5008SPalmer Dabbelt  * This is a very specific barrier: it's currently only used in two places in
493cfa5008SPalmer Dabbelt  * the kernel, both in the scheduler.  See include/linux/spinlock.h for the two
503cfa5008SPalmer Dabbelt  * orderings it guarantees, but the "critical section is RCsc" guarantee
513cfa5008SPalmer Dabbelt  * mandates a barrier on RISC-V.  The sequence looks like:
523cfa5008SPalmer Dabbelt  *
533cfa5008SPalmer Dabbelt  *    lr.aq lock
543cfa5008SPalmer Dabbelt  *    sc    lock <= LOCKED
553cfa5008SPalmer Dabbelt  *    smp_mb__after_spinlock()
563cfa5008SPalmer Dabbelt  *    // critical section
573cfa5008SPalmer Dabbelt  *    lr    lock
583cfa5008SPalmer Dabbelt  *    sc.rl lock <= UNLOCKED
593cfa5008SPalmer Dabbelt  *
603cfa5008SPalmer Dabbelt  * The AQ/RL pair provides a RCpc critical section, but there's not really any
613cfa5008SPalmer Dabbelt  * way we can take advantage of that here because the ordering is only enforced
623cfa5008SPalmer Dabbelt  * on that one lock.  Thus, we're just doing a full fence.
6338b7c2a3SPalmer Dabbelt  *
6438b7c2a3SPalmer Dabbelt  * Since we allow writeX to be called from preemptive regions we need at least
6538b7c2a3SPalmer Dabbelt  * an "o" in the predecessor set to ensure device writes are visible before the
6638b7c2a3SPalmer Dabbelt  * task is marked as available for scheduling on a new hart.  While I don't see
6738b7c2a3SPalmer Dabbelt  * any concrete reason we need a full IO fence, it seems safer to just upgrade
6838b7c2a3SPalmer Dabbelt  * this in order to avoid any IO crossing a scheduling boundary.  In both
6938b7c2a3SPalmer Dabbelt  * instances the scheduler pairs this with an mb(), so nothing is necessary on
7038b7c2a3SPalmer Dabbelt  * the new hart.
713cfa5008SPalmer Dabbelt  */
7238b7c2a3SPalmer Dabbelt #define smp_mb__after_spinlock()	RISCV_FENCE(iorw,iorw)
733cfa5008SPalmer Dabbelt 
74fab957c1SPalmer Dabbelt #include <asm-generic/barrier.h>
75fab957c1SPalmer Dabbelt 
76fab957c1SPalmer Dabbelt #endif /* __ASSEMBLY__ */
77fab957c1SPalmer Dabbelt 
78fab957c1SPalmer Dabbelt #endif /* _ASM_RISCV_BARRIER_H */
79