| 1 | /* |
| 2 | * Copyright (c) 2003 Hewlett-Packard Development Company, L.P. |
| 3 | * |
| 4 | * Permission is hereby granted, free of charge, to any person obtaining a copy |
| 5 | * of this software and associated documentation files (the "Software"), to deal |
| 6 | * in the Software without restriction, including without limitation the rights |
| 7 | * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell |
| 8 | * copies of the Software, and to permit persons to whom the Software is |
| 9 | * furnished to do so, subject to the following conditions: |
| 10 | * |
| 11 | * The above copyright notice and this permission notice shall be included in |
| 12 | * all copies or substantial portions of the Software. |
| 13 | * |
| 14 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| 15 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| 16 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE |
| 17 | * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| 18 | * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
| 19 | * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE |
| 20 | * SOFTWARE. |
| 21 | */ |
| 22 | |
| 23 | #include "../all_atomic_load_store.h" |
| 24 | |
| 25 | /* Some architecture set descriptions include special "ordered" memory */ |
| 26 | /* operations. As far as we can tell, no existing processors actually */ |
| 27 | /* require those. Nor does it appear likely that future processors */ |
| 28 | /* will. */ |
| 29 | #include "../ordered.h" |
| 30 | |
/* The ldcw lock word has to sit on a stricter alignment boundary than */
/* GCC will guarantee for this type.  Four consecutive words are       */
/* therefore reserved, and the correctly aligned one is selected when  */
/* the location is accessed.  The technique comes from the glibc 2.3.2 */
/* linuxthreads port.                                                  */
struct AO_pa_clearable_loc {
  int data[4];  /* only the suitably aligned element is used as the lock */
};
| 37 | |
/* Only an atomic "clear" instruction is available, so the meaning of  */
/* the two states is swapped relative to the usual encoding: zero      */
/* stands for "set" and one stands for "clear".                        */
typedef enum {
  AO_PA_TS_set = 0,
  AO_PA_TS_clear = 1
} AO_PA_TS_val;

/* Test-and-set location type and its initial (clear) contents.        */
#undef AO_TS_INITIALIZER
#define AO_TS_INITIALIZER { { 1, 1, 1, 1 } }
#define AO_TS_t struct AO_pa_clearable_loc

/* Value type returned by test-and-set and its two states.             */
#define AO_TS_VAL_t AO_PA_TS_val
#define AO_TS_SET AO_PA_TS_set
#define AO_TS_CLEAR AO_PA_TS_clear
| 47 | |
/* The hppa only has one atomic read and modify memory operation, load */
/* and clear word (ldcw), so hppa spinlocks must use zero to signify   */
/* that someone is holding the lock.  The address used for the ldcw    */
/* semaphore must be 16-byte aligned.                                  */
/*                                                                     */
/* AO_ldcw(a, ret) loads the word at "a" into "ret" and clears it.     */
/* The lock word is declared "+m" because the instruction reads it as  */
/* well as writes it.  The "memory" clobber makes the statement a      */
/* compiler barrier, so that ordinary loads and stores are neither     */
/* cached in registers nor moved across the lock operation.            */
#define AO_ldcw(a, ret) \
  __asm__ __volatile__("ldcw 0(%2), %0" \
                       : "=r" (ret), "+m" (*(a)) \
                       : "r" (a) \
                       : "memory")
| 55 | |
/* malloc only guarantees 8-byte alignment for the data it returns and */
/* GCC only guarantees 8-byte alignment for stack locals, so putting   */
/* "__attribute ((aligned(16)))" on the type declaration would not     */
/* assure the 16-byte alignment needed for atomic lock data.  The lock */
/* type is instead a struct holding an array of four ints, and the     */
/* 16-byte aligned int within that array is chosen dynamically.        */
/*                                                                     */
/* AO_ldcw_align(addr) rounds addr up to the next multiple of          */
/* AO_PA_LDCW_ALIGNMENT (addr itself if it is already aligned) and     */
/* yields the result as a pointer to a volatile unsigned word.         */
#define AO_PA_LDCW_ALIGNMENT 16
#define AO_ldcw_align(addr) \
  ((volatile unsigned *) \
     (((unsigned long)(addr) + (AO_PA_LDCW_ALIGNMENT - 1)) \
      & ~(unsigned long)(AO_PA_LDCW_ALIGNMENT - 1)))
| 68 | |
| 69 | /* Works on PA 1.1 and PA 2.0 systems */ |
| 70 | AO_INLINE AO_TS_VAL_t |
| 71 | AO_test_and_set_full(volatile AO_TS_t * addr) |
| 72 | { |
| 73 | volatile unsigned int ret; |
| 74 | volatile unsigned *a = AO_ldcw_align(addr); |
| 75 | |
| 76 | AO_ldcw(a, ret); |
| 77 | return (AO_TS_VAL_t)ret; |
| 78 | } |
| 79 | #define AO_HAVE_test_and_set_full |
| 80 | |
| 81 | AO_INLINE void |
| 82 | AO_pa_clear(volatile AO_TS_t * addr) |
| 83 | { |
| 84 | volatile unsigned *a = AO_ldcw_align(addr); |
| 85 | |
| 86 | AO_compiler_barrier(); |
| 87 | *a = 1; |
| 88 | } |
| 89 | #define AO_CLEAR(addr) AO_pa_clear(addr) |
| 90 | #define AO_HAVE_CLEAR |
| 91 | |
/* The ldcw helper macros are private to this file; remove them so     */
/* they do not leak into code that includes it.                        */
#undef AO_ldcw_align
#undef AO_ldcw
#undef AO_PA_LDCW_ALIGNMENT
| 95 | |