]>
Commit | Line | Data |
---|---|---|
b2441318 | 1 | /* SPDX-License-Identifier: GPL-2.0 */ |
527dcdcc DH |
2 | #ifndef __PARISC_LDCW_H |
3 | #define __PARISC_LDCW_H | |
4 | ||
527dcdcc DH |
5 | /* Because kmalloc only guarantees 8-byte alignment for kmalloc'd data, |
6 | and GCC only guarantees 8-byte alignment for stack locals, we can't | |
7 | be assured of 16-byte alignment for atomic lock data even if we | |
8 | specify "__attribute ((aligned(16)))" in the type declaration. So, | |
9 | we use a struct containing an array of four ints for the atomic lock | |
10 | type and dynamically select the 16-byte aligned int from the array | |
914988e0 JDA |
11 | for the semaphore. */ |
12 | ||
13 | /* From: "Jim Hull" <jim.hull of hp.com> | |
14 | I've attached a summary of the change, but basically, for PA 2.0, as | |
15 | long as the ",CO" (coherent operation) completer is implemented, then the | |
16 | 16-byte alignment requirement for ldcw and ldcd is relaxed, and instead | |
17 | they only require "natural" alignment (4-byte for ldcw, 8-byte for | |
18 | ldcd). | |
19 | ||
20 | Although the cache control hint is accepted by all PA 2.0 processors, | |
21 | it is only implemented on PA8800/PA8900 CPUs. Prior PA8X00 CPUs still | |
22 | require 16-byte alignment. If the address is unaligned, the operation | |
23 | of the instruction is undefined. The ldcw instruction does not generate | |
24 | unaligned data reference traps so misaligned accesses are not detected. | |
25 | This hid the problem for years. So, restore the 16-byte alignment dropped | |
26 | by Kyle McMartin in "Remove __ldcw_align for PA-RISC 2.0 processors". */ | |
527dcdcc DH |
27 | |
28 | #define __PA_LDCW_ALIGNMENT 16 | |
29 | #define __ldcw_align(a) ({ \ | |
30 | unsigned long __ret = (unsigned long) &(a)->lock[0]; \ | |
31 | __ret = (__ret + __PA_LDCW_ALIGNMENT - 1) \ | |
32 | & ~(__PA_LDCW_ALIGNMENT - 1); \ | |
33 | (volatile unsigned int *) __ret; \ | |
34 | }) | |
527dcdcc | 35 | |
914988e0 | 36 | #ifdef CONFIG_PA20 |
527dcdcc | 37 | #define __LDCW "ldcw,co" |
914988e0 JDA |
38 | #else |
39 | #define __LDCW "ldcw" | |
40 | #endif | |
527dcdcc | 41 | |
45db0738 JDA |
42 | /* LDCW, the only atomic read-write operation PA-RISC has. *sigh*. |
43 | We don't explicitly expose that "*a" may be written as reload | |
44 | fails to find a register in class R1_REGS when "a" needs to be | |
45 | reloaded when generating 64-bit PIC code. Instead, we clobber | |
46 | memory to indicate to the compiler that the assembly code reads | |
47 | or writes to items other than those listed in the input and output | |
48 | operands. This may pessimize the code somewhat but __ldcw is | |
d14b3dfc | 49 | usually used within code blocks surrounded by memory barriers. */ |
527dcdcc DH |
50 | #define __ldcw(a) ({ \ |
51 | unsigned __ret; \ | |
45db0738 JDA |
52 | __asm__ __volatile__(__LDCW " 0(%1),%0" \ |
53 | : "=r" (__ret) : "r" (a) : "memory"); \ | |
527dcdcc DH |
54 | __ret; \ |
55 | }) | |
56 | ||
57 | #ifdef CONFIG_SMP | |
b28fc0d8 | 58 | # define __lock_aligned __section(".data..lock_aligned") __aligned(16) |
527dcdcc DH |
59 | #endif |
60 | ||
61 | #endif /* __PARISC_LDCW_H */ |