1114117Simp/* SPDX-License-Identifier: GPL-2.0-only */
250476Speter/*
31592Srgrimes * Based on arch/arm/include/asm/barrier.h
4156813Sru *
5156813Sru * Copyright (C) 2012 ARM Ltd.
6241823Smarcel */
7241823Smarcel#ifndef __ASM_BARRIER_H
853909Speter#define __ASM_BARRIER_H
9183242Ssam
1053909Speter#ifndef __ASSEMBLY__
1153909Speter
1253909Speter#include <linux/kasan-checks.h>
13272322Sdelphij
14124587Sru#include <asm/alternative-macros.h>
15137675Sbz
16183242Ssam#define __nops(n)	".rept	" #n "\nnop\n.endr\n"
1753909Speter#define nops(n)		asm volatile(__nops(n))
1853909Speter
19143026Strhodes#define sev()		asm volatile("sev" : : : "memory")
2053909Speter#define wfe()		asm volatile("wfe" : : : "memory")
21104385Smike#define wfet(val)	asm volatile("msr s0_3_c1_c0_0, %0"	\
2253909Speter				     : : "r" (val) : "memory")
2353909Speter#define wfi()		asm volatile("wfi" : : : "memory")
2453909Speter#define wfit(val)	asm volatile("msr s0_3_c1_c0_1, %0"	\
25143026Strhodes				     : : "r" (val) : "memory")
26124587Sru
2770922Sdougb#define isb()		asm volatile("isb" : : : "memory")
28124587Sru#define dmb(opt)	asm volatile("dmb " #opt : : : "memory")
2953909Speter#define dsb(opt)	asm volatile("dsb " #opt : : : "memory")
30101808Sdwmalone
31183242Ssam#define psb_csync()	asm volatile("hint #17" : : : "memory")
32260024Sjmmv#define __tsb_csync()	asm volatile("hint #18" : : : "memory")
3353909Speter#define csdb()		asm volatile("hint #20" : : : "memory")
34171173Smlaier
35200062Sed/*
36137675Sbz * Data Gathering Hint:
371592Srgrimes * This instruction prevents merging memory accesses with Normal-NC or
38183242Ssam * Device-GRE attributes before the hint instruction with any memory accesses
39183242Ssam * appearing after the hint instruction.
40183242Ssam */
41183242Ssam#define dgh()		asm volatile("hint #6" : : : "memory")
42183242Ssam
43183242Ssam#ifdef CONFIG_ARM64_PSEUDO_NMI
44183242Ssam#define pmr_sync()						\
45183242Ssam	do {							\
46272322Sdelphij		asm volatile(					\
47272322Sdelphij		ALTERNATIVE_CB("dsb sy",			\
48272322Sdelphij			       ARM64_HAS_GIC_PRIO_RELAXED_SYNC,	\
49272322Sdelphij			       alt_cb_patch_nops)		\
50156813Sru		);						\
51137675Sbz	} while(0)
52137675Sbz#else
53137675Sbz#define pmr_sync()	do {} while (0)
54137675Sbz#endif
55183242Ssam
56183242Ssam#define __mb()		dsb(sy)
57183242Ssam#define __rmb()		dsb(ld)
58183242Ssam#define __wmb()		dsb(st)
59156813Sru
60171173Smlaier#define __dma_mb()	dmb(osh)
61126756Smlaier#define __dma_rmb()	dmb(oshld)
62126756Smlaier#define __dma_wmb()	dmb(oshst)
63173220Syar
64124587Sru#define io_stop_wc()	dgh()
6553909Speter
6653909Speter#define tsb_csync()								\
67156813Sru	do {									\
68143107Sru		/*								\
69143026Strhodes		 * CPUs affected by Arm Erratum 2054223 or 2067961 needs	\
70143026Strhodes		 * another TSB to ensure the trace is flushed. The barriers	\
71143026Strhodes		 * don't have to be strictly back to back, as long as the	\
72156813Sru		 * CPU is in trace prohibited state.				\
73124587Sru		 */								\
74183242Ssam		if (cpus_have_final_cap(ARM64_WORKAROUND_TSB_FLUSH_FAILURE))	\
7538101Speter			__tsb_csync();						\
7638101Speter		__tsb_csync();							\
77183242Ssam	} while (0)
78183242Ssam
79183242Ssam/*
80183242Ssam * Generate a mask for array_index__nospec() that is ~0UL when 0 <= idx < sz
81260013Sjmmv * and 0 otherwise.
82260013Sjmmv */
83260024Sjmmv#define array_index_mask_nospec array_index_mask_nospec
84260013Sjmmvstatic inline unsigned long array_index_mask_nospec(unsigned long idx,
85260013Sjmmv						    unsigned long sz)
861592Srgrimes{
87	unsigned long mask;
88
89	asm volatile(
90	"	cmp	%1, %2\n"
91	"	sbc	%0, xzr, xzr\n"
92	: "=r" (mask)
93	: "r" (idx), "Ir" (sz)
94	: "cc");
95
96	csdb();
97	return mask;
98}
99
100/*
101 * Ensure that reads of the counter are treated the same as memory reads
102 * for the purposes of ordering by subsequent memory barriers.
103 *
104 * This insanity brought to you by speculative system register reads,
105 * out-of-order memory accesses, sequence locks and Thomas Gleixner.
106 *
107 * https://lore.kernel.org/r/alpine.DEB.2.21.1902081950260.1662@nanos.tec.linutronix.de/
108 */
109#define arch_counter_enforce_ordering(val) do {				\
110	u64 tmp, _val = (val);						\
111									\
112	asm volatile(							\
113	"	eor	%0, %1, %1\n"					\
114	"	add	%0, sp, %0\n"					\
115	"	ldr	xzr, [%0]"					\
116	: "=r" (tmp) : "r" (_val));					\
117} while (0)
118
119#define __smp_mb()	dmb(ish)
120#define __smp_rmb()	dmb(ishld)
121#define __smp_wmb()	dmb(ishst)
122
123#define __smp_store_release(p, v)					\
124do {									\
125	typeof(p) __p = (p);						\
126	union { __unqual_scalar_typeof(*p) __val; char __c[1]; } __u =	\
127		{ .__val = (__force __unqual_scalar_typeof(*p)) (v) };	\
128	compiletime_assert_atomic_type(*p);				\
129	kasan_check_write(__p, sizeof(*p));				\
130	switch (sizeof(*p)) {						\
131	case 1:								\
132		asm volatile ("stlrb %w1, %0"				\
133				: "=Q" (*__p)				\
134				: "rZ" (*(__u8 *)__u.__c)		\
135				: "memory");				\
136		break;							\
137	case 2:								\
138		asm volatile ("stlrh %w1, %0"				\
139				: "=Q" (*__p)				\
140				: "rZ" (*(__u16 *)__u.__c)		\
141				: "memory");				\
142		break;							\
143	case 4:								\
144		asm volatile ("stlr %w1, %0"				\
145				: "=Q" (*__p)				\
146				: "rZ" (*(__u32 *)__u.__c)		\
147				: "memory");				\
148		break;							\
149	case 8:								\
150		asm volatile ("stlr %x1, %0"				\
151				: "=Q" (*__p)				\
152				: "rZ" (*(__u64 *)__u.__c)		\
153				: "memory");				\
154		break;							\
155	}								\
156} while (0)
157
158#define __smp_load_acquire(p)						\
159({									\
160	union { __unqual_scalar_typeof(*p) __val; char __c[1]; } __u;	\
161	typeof(p) __p = (p);						\
162	compiletime_assert_atomic_type(*p);				\
163	kasan_check_read(__p, sizeof(*p));				\
164	switch (sizeof(*p)) {						\
165	case 1:								\
166		asm volatile ("ldarb %w0, %1"				\
167			: "=r" (*(__u8 *)__u.__c)			\
168			: "Q" (*__p) : "memory");			\
169		break;							\
170	case 2:								\
171		asm volatile ("ldarh %w0, %1"				\
172			: "=r" (*(__u16 *)__u.__c)			\
173			: "Q" (*__p) : "memory");			\
174		break;							\
175	case 4:								\
176		asm volatile ("ldar %w0, %1"				\
177			: "=r" (*(__u32 *)__u.__c)			\
178			: "Q" (*__p) : "memory");			\
179		break;							\
180	case 8:								\
181		asm volatile ("ldar %0, %1"				\
182			: "=r" (*(__u64 *)__u.__c)			\
183			: "Q" (*__p) : "memory");			\
184		break;							\
185	}								\
186	(typeof(*p))__u.__val;						\
187})
188
189#define smp_cond_load_relaxed(ptr, cond_expr)				\
190({									\
191	typeof(ptr) __PTR = (ptr);					\
192	__unqual_scalar_typeof(*ptr) VAL;				\
193	for (;;) {							\
194		VAL = READ_ONCE(*__PTR);				\
195		if (cond_expr)						\
196			break;						\
197		__cmpwait_relaxed(__PTR, VAL);				\
198	}								\
199	(typeof(*ptr))VAL;						\
200})
201
202#define smp_cond_load_acquire(ptr, cond_expr)				\
203({									\
204	typeof(ptr) __PTR = (ptr);					\
205	__unqual_scalar_typeof(*ptr) VAL;				\
206	for (;;) {							\
207		VAL = smp_load_acquire(__PTR);				\
208		if (cond_expr)						\
209			break;						\
210		__cmpwait_relaxed(__PTR, VAL);				\
211	}								\
212	(typeof(*ptr))VAL;						\
213})
214
215#include <asm-generic/barrier.h>
216
217#endif	/* __ASSEMBLY__ */
218
219#endif	/* __ASM_BARRIER_H */
220