1/*
2 * Copyright 2009-2016 Samy Al Bahra.
3 * Copyright 2013-2016 Olivier Houchard.
4 * All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions
8 * are met:
9 * 1. Redistributions of source code must retain the above copyright
10 *    notice, this list of conditions and the following disclaimer.
11 * 2. Redistributions in binary form must reproduce the above copyright
12 *    notice, this list of conditions and the following disclaimer in the
13 *    documentation and/or other materials provided with the distribution.
14 *
15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25 * SUCH DAMAGE.
26 */
27
28#ifndef CK_PR_AARCH64_LLSC_H
29#define CK_PR_AARCH64_LLSC_H
30
31#ifndef CK_PR_H
32#error Do not include this file directly, use ck_pr.h
33#endif
34
35CK_CC_INLINE static bool
36ck_pr_cas_64_2_value(uint64_t target[2], uint64_t compare[2], uint64_t set[2], uint64_t value[2])
37{
38        uint64_t tmp1, tmp2;
39
40        __asm__ __volatile__("1:"
41                             "ldxp %0, %1, [%4];"
42                             "mov %2, %0;"
43                             "mov %3, %1;"
44                             "eor %0, %0, %5;"
45                             "eor %1, %1, %6;"
46                             "orr %1, %0, %1;"
47                             "mov %w0, #0;"
48                             "cbnz %1, 2f;"
49                             "stxp %w0, %7, %8, [%4];"
50                             "cbnz %w0, 1b;"
51                             "mov %w0, #1;"
52                             "2:"
53                             : "=&r" (tmp1), "=&r" (tmp2), "=&r" (value[0]), "=&r" (value[1])
54                             : "r" (target), "r" (compare[0]), "r" (compare[1]), "r" (set[0]), "r" (set[1])
55                             : "cc", "memory");
56
57        return (tmp1);
58}
59
60CK_CC_INLINE static bool
61ck_pr_cas_ptr_2_value(void *target, void *compare, void *set, void *value)
62{
63        return (ck_pr_cas_64_2_value(CK_CPP_CAST(uint64_t *, target),
64                                   CK_CPP_CAST(uint64_t *, compare),
65                                   CK_CPP_CAST(uint64_t *, set),
66                                   CK_CPP_CAST(uint64_t *, value)));
67}
68
69CK_CC_INLINE static bool
70ck_pr_cas_64_2(uint64_t target[2], uint64_t compare[2], uint64_t set[2])
71{
72        uint64_t tmp1, tmp2;
73
74        __asm__ __volatile__("1:"
75                             "ldxp %0, %1, [%2];"
76                             "eor %0, %0, %3;"
77                             "eor %1, %1, %4;"
78                             "orr %1, %0, %1;"
79                             "mov %w0, #0;"
80                             "cbnz %1, 2f;"
81                             "stxp %w0, %5, %6, [%2];"
82                             "cbnz %w0, 1b;"
83                             "mov %w0, #1;"
84                             "2:"
85                             : "=&r" (tmp1), "=&r" (tmp2)
86                             : "r" (target), "r" (compare[0]), "r" (compare[1]), "r" (set[0]), "r" (set[1])
87                             : "cc", "memory");
88
89        return (tmp1);
90}
91CK_CC_INLINE static bool
92ck_pr_cas_ptr_2(void *target, void *compare, void *set)
93{
94        return (ck_pr_cas_64_2(CK_CPP_CAST(uint64_t *, target),
95                             CK_CPP_CAST(uint64_t *, compare),
96                             CK_CPP_CAST(uint64_t *, set)));
97}
98
99
100#define CK_PR_CAS(N, M, T, W, R)					\
101        CK_CC_INLINE static bool					\
102        ck_pr_cas_##N##_value(M *target, T compare, T set, M *value)	\
103        {								\
104                T previous;						\
105                T tmp;							\
106                __asm__ __volatile__("1:"				\
107                                     "ldxr" W " %" R "0, [%2];"		\
108                                     "cmp  %" R "0, %" R "4;"		\
109                                     "b.ne 2f;"				\
110                                     "stxr" W " %w1, %" R "3, [%2];"	\
111                                     "cbnz %w1, 1b;"			\
112                                     "2:"				\
113                    : "=&r" (previous),					\
114                    "=&r" (tmp)						\
115                    : "r"   (target),					\
116                    "r"   (set),					\
117                    "r"   (compare)					\
118                    : "memory", "cc");					\
119                *(T *)value = previous;					\
120                return (previous == compare);				\
121        }								\
122        CK_CC_INLINE static bool					\
123        ck_pr_cas_##N(M *target, T compare, T set)			\
124        {								\
125                T previous;						\
126                T tmp;							\
127                __asm__ __volatile__(					\
128                                     "1:"				\
129                                     "ldxr" W " %" R "0, [%2];"		\
130                                     "cmp  %" R "0, %" R "4;"		\
131                                     "b.ne 2f;"				\
132                                     "stxr" W " %w1, %" R "3, [%2];"	\
133                                     "cbnz %w1, 1b;"			\
134                                     "2:"				\
135                    : "=&r" (previous),					\
136                    "=&r" (tmp)						\
137                    : "r"   (target),					\
138                    "r"   (set),					\
139                    "r"   (compare)					\
140                    : "memory", "cc");					\
141                return (previous == compare);				\
142        }
143
144CK_PR_CAS(ptr, void, void *, "", "")
145
146#define CK_PR_CAS_S(N, M, W, R)	CK_PR_CAS(N, M, M, W, R)
147CK_PR_CAS_S(64, uint64_t, "", "")
148#ifndef CK_PR_DISABLE_DOUBLE
149CK_PR_CAS_S(double, double, "", "")
150#endif
151CK_PR_CAS_S(32, uint32_t, "", "w")
152CK_PR_CAS_S(uint, unsigned int, "", "w")
153CK_PR_CAS_S(int, int, "", "w")
154CK_PR_CAS_S(16, uint16_t, "h", "w")
155CK_PR_CAS_S(8, uint8_t, "b", "w")
156CK_PR_CAS_S(short, short, "h", "w")
157CK_PR_CAS_S(char, char, "b", "w")
158
159
160#undef CK_PR_CAS_S
161#undef CK_PR_CAS
162
163#define CK_PR_FAS(N, M, T, W, R)				\
164        CK_CC_INLINE static T					\
165        ck_pr_fas_##N(M *target, T v)				\
166        {							\
167                T previous;					\
168                T tmp;						\
169                __asm__ __volatile__("1:"			\
170                                     "ldxr" W " %" R "0, [%2];"	\
171                                     "stxr" W " %w1, %" R "3, [%2];"\
172                                     "cbnz %w1, 1b;"		\
173                                        : "=&r" (previous),	\
174                                          "=&r" (tmp) 		\
175                                        : "r"   (target),	\
176                                          "r"   (v)		\
177                                        : "memory", "cc");	\
178                return (previous);				\
179        }
180
181CK_PR_FAS(64, uint64_t, uint64_t, "", "")
182CK_PR_FAS(32, uint32_t, uint32_t, "", "w")
183CK_PR_FAS(ptr, void, void *, "", "")
184CK_PR_FAS(int, int, int, "", "w")
185CK_PR_FAS(uint, unsigned int, unsigned int, "", "w")
186CK_PR_FAS(16, uint16_t, uint16_t, "h", "w")
187CK_PR_FAS(8, uint8_t, uint8_t, "b", "w")
188CK_PR_FAS(short, short, short, "h", "w")
189CK_PR_FAS(char, char, char, "b", "w")
190
191
192#undef CK_PR_FAS
193
194#define CK_PR_UNARY(O, N, M, T, I, W, R)			\
195        CK_CC_INLINE static void				\
196        ck_pr_##O##_##N(M *target)				\
197        {							\
198                T previous = 0;					\
199                T tmp = 0;					\
200                __asm__ __volatile__("1:"			\
201                                     "ldxr" W " %" R "0, [%2];"	\
202                                      I ";"			\
203                                     "stxr" W " %w1, %" R "0, [%2];"	\
204                                     "cbnz %w1, 1b;"		\
205                                        : "=&r" (previous),	\
206                                          "=&r" (tmp)		\
207                                        : "r"   (target)	\
208                                        : "memory", "cc");	\
209                return;						\
210        }
211
212CK_PR_UNARY(inc, ptr, void, void *, "add %0, %0, #1", "", "")
213CK_PR_UNARY(dec, ptr, void, void *, "sub %0, %0, #1", "", "")
214CK_PR_UNARY(not, ptr, void, void *, "mvn %0, %0", "", "")
215CK_PR_UNARY(inc, 64, uint64_t, uint64_t, "add %0, %0, #1", "", "")
216CK_PR_UNARY(dec, 64, uint64_t, uint64_t, "sub %0, %0, #1", "", "")
217CK_PR_UNARY(not, 64, uint64_t, uint64_t, "mvn %0, %0", "", "")
218
219#define CK_PR_UNARY_S(S, T, W)					\
220        CK_PR_UNARY(inc, S, T, T, "add %w0, %w0, #1", W, "w")	\
221        CK_PR_UNARY(dec, S, T, T, "sub %w0, %w0, #1", W, "w")	\
222        CK_PR_UNARY(not, S, T, T, "mvn %w0, %w0", W, "w")	\
223
224CK_PR_UNARY_S(32, uint32_t, "")
225CK_PR_UNARY_S(uint, unsigned int, "")
226CK_PR_UNARY_S(int, int, "")
227CK_PR_UNARY_S(16, uint16_t, "h")
228CK_PR_UNARY_S(8, uint8_t, "b")
229CK_PR_UNARY_S(short, short, "h")
230CK_PR_UNARY_S(char, char, "b")
231
232#undef CK_PR_UNARY_S
233#undef CK_PR_UNARY
234
235#define CK_PR_BINARY(O, N, M, T, I, W, R)			\
236        CK_CC_INLINE static void				\
237        ck_pr_##O##_##N(M *target, T delta)			\
238        {							\
239                T previous;					\
240                T tmp;						\
241                __asm__ __volatile__("1:"			\
242                                     "ldxr" W " %" R "0, [%2];"\
243                                      I " %" R "0, %" R "0, %" R "3;"	\
244                                     "stxr" W " %w1, %" R "0, [%2];"	\
245                                     "cbnz %w1, 1b;"		\
246                                        : "=&r" (previous),	\
247                                          "=&r" (tmp)		\
248                                        : "r"   (target),	\
249                                          "r"   (delta)		\
250                                        : "memory", "cc");	\
251                return;						\
252        }
253
254CK_PR_BINARY(and, ptr, void, uintptr_t, "and", "", "")
255CK_PR_BINARY(add, ptr, void, uintptr_t, "add", "", "")
256CK_PR_BINARY(or, ptr, void, uintptr_t, "orr", "", "")
257CK_PR_BINARY(sub, ptr, void, uintptr_t, "sub", "", "")
258CK_PR_BINARY(xor, ptr, void, uintptr_t, "eor", "", "")
259CK_PR_BINARY(and, 64, uint64_t, uint64_t, "and", "", "")
260CK_PR_BINARY(add, 64, uint64_t, uint64_t, "add", "", "")
261CK_PR_BINARY(or, 64, uint64_t, uint64_t, "orr", "", "")
262CK_PR_BINARY(sub, 64, uint64_t, uint64_t, "sub", "", "")
263CK_PR_BINARY(xor, 64, uint64_t, uint64_t, "eor", "", "")
264
265#define CK_PR_BINARY_S(S, T, W)				\
266        CK_PR_BINARY(and, S, T, T, "and", W, "w")	\
267        CK_PR_BINARY(add, S, T, T, "add", W, "w")	\
268        CK_PR_BINARY(or, S, T, T, "orr", W, "w")	\
269        CK_PR_BINARY(sub, S, T, T, "sub", W, "w")	\
270        CK_PR_BINARY(xor, S, T, T, "eor", W, "w")
271
272CK_PR_BINARY_S(32, uint32_t, "")
273CK_PR_BINARY_S(uint, unsigned int, "")
274CK_PR_BINARY_S(int, int, "")
275CK_PR_BINARY_S(16, uint16_t, "h")
276CK_PR_BINARY_S(8, uint8_t, "b")
277CK_PR_BINARY_S(short, short, "h")
278CK_PR_BINARY_S(char, char, "b")
279
280#undef CK_PR_BINARY_S
281#undef CK_PR_BINARY
282
283CK_CC_INLINE static void *
284ck_pr_faa_ptr(void *target, uintptr_t delta)
285{
286        uintptr_t previous, r, tmp;
287
288        __asm__ __volatile__("1:"
289                             "ldxr %0, [%3];"
290                             "add %1, %4, %0;"
291                             "stxr %w2, %1, [%3];"
292                             "cbnz %w2, 1b;"
293                                : "=&r" (previous),
294                                  "=&r" (r),
295                                  "=&r" (tmp)
296                                : "r"   (target),
297                                  "r"   (delta)
298                                : "memory", "cc");
299
300        return (void *)(previous);
301}
302
303CK_CC_INLINE static uint64_t
304ck_pr_faa_64(uint64_t *target, uint64_t delta)
305{
306        uint64_t previous, r, tmp;
307
308        __asm__ __volatile__("1:"
309                             "ldxr %0, [%3];"
310                             "add %1, %4, %0;"
311                             "stxr %w2, %1, [%3];"
312                             "cbnz %w2, 1b;"
313                                : "=&r" (previous),
314                                  "=&r" (r),
315                                  "=&r" (tmp)
316                                : "r"   (target),
317                                  "r"   (delta)
318                                : "memory", "cc");
319
320        return (previous);
321}
322
323#define CK_PR_FAA(S, T, W)						\
324        CK_CC_INLINE static T						\
325        ck_pr_faa_##S(T *target, T delta)				\
326        {								\
327                T previous, r, tmp;					\
328                __asm__ __volatile__("1:"				\
329                                     "ldxr" W " %w0, [%3];"		\
330                                     "add %w1, %w4, %w0;"		\
331                                     "stxr" W " %w2, %w1, [%3];"	\
332                                     "cbnz %w2, 1b;"			\
333                                        : "=&r" (previous),		\
334                                          "=&r" (r),			\
335                                          "=&r" (tmp)			\
336                                        : "r"   (target),		\
337                                          "r"   (delta)			\
338                                        : "memory", "cc");		\
339                return (previous);					\
340        }
341
342CK_PR_FAA(32, uint32_t, "")
343CK_PR_FAA(uint, unsigned int, "")
344CK_PR_FAA(int, int, "")
345CK_PR_FAA(16, uint16_t, "h")
346CK_PR_FAA(8, uint8_t, "b")
347CK_PR_FAA(short, short, "h")
348CK_PR_FAA(char, char, "b")
349
350#undef CK_PR_FAA
351
352#endif /* CK_PR_AARCH64_LLSC_H */
353