1/* Shared HTM header. Work around false transactional execution facility
2 intrinsics.
3
4 Copyright (C) 2016-2022 Free Software Foundation, Inc.
5 This file is part of the GNU C Library.
6
7 The GNU C Library is free software; you can redistribute it and/or
8 modify it under the terms of the GNU Lesser General Public
9 License as published by the Free Software Foundation; either
10 version 2.1 of the License, or (at your option) any later version.
11
12 The GNU C Library is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 Lesser General Public License for more details.
16
17 You should have received a copy of the GNU Lesser General Public
18 License along with the GNU C Library; if not, see
19 <https://www.gnu.org/licenses/>. */
20
21#ifndef _HTM_H
22#define _HTM_H 1
23
24#include <htmintrin.h>
25
26#ifdef __s390x__
27# define TX_FPRS_BYTES 64
28# define TX_SAVE_FPRS \
29 " std %%f8, 0(%[R_FPRS])\n\t" \
30 " std %%f9, 8(%[R_FPRS])\n\t" \
31 " std %%f10, 16(%[R_FPRS])\n\t" \
32 " std %%f11, 24(%[R_FPRS])\n\t" \
33 " std %%f12, 32(%[R_FPRS])\n\t" \
34 " std %%f13, 40(%[R_FPRS])\n\t" \
35 " std %%f14, 48(%[R_FPRS])\n\t" \
36 " std %%f15, 56(%[R_FPRS])\n\t"
37
38# define TX_RESTORE_FPRS \
39 " ld %%f8, 0(%[R_FPRS])\n\t" \
40 " ld %%f9, 8(%[R_FPRS])\n\t" \
41 " ld %%f10, 16(%[R_FPRS])\n\t" \
42 " ld %%f11, 24(%[R_FPRS])\n\t" \
43 " ld %%f12, 32(%[R_FPRS])\n\t" \
44 " ld %%f13, 40(%[R_FPRS])\n\t" \
45 " ld %%f14, 48(%[R_FPRS])\n\t" \
46 " ld %%f15, 56(%[R_FPRS])\n\t"
47
48#else
49
50# define TX_FPRS_BYTES 16
51# define TX_SAVE_FPRS \
52 " std %%f4, 0(%[R_FPRS])\n\t" \
53 " std %%f6, 8(%[R_FPRS])\n\t"
54
55# define TX_RESTORE_FPRS \
56 " ld %%f4, 0(%[R_FPRS])\n\t" \
57 " ld %%f6, 8(%[R_FPRS])\n\t"
58
59#endif /* ! __s390x__ */
60
61/* Use own inline assembly instead of __builtin_tbegin, as tbegin
62 has to filter program interruptions which can't be done with the builtin.
63 Now the fprs have to be saved / restored here, too.
64 The fpc is also not saved / restored with the builtin.
65 The used inline assembly does not clobber the volatile fprs / vrs!
66 Clobbering the latter ones would force the compiler to save / restore
67 the call saved fprs as those overlap with the vrs, but they only need to be
68 restored if the transaction fails but not if the transaction is successfully
69 started. Thus the user of the tbegin macros in this header file has to
70 compile the file / function with -msoft-float. It prevents gcc from using
71 fprs / vrs. */
72#define __libc_tbegin(tdb) __libc_tbegin_base(tdb,,,)
73
74#define __libc_tbegin_retry_output_regs , [R_TX_CNT] "+&d" (__tx_cnt)
75#define __libc_tbegin_retry_input_regs(retry_cnt) , [R_RETRY] "d" (retry_cnt)
76#define __libc_tbegin_retry_abort_path_insn \
77 /* If tbegin returned _HTM_TBEGIN_TRANSIENT, retry immediately so \
78 that max tbegin_cnt transactions are tried. Otherwise return and \
79 let the caller of this macro do the fallback path. */ \
80 " jnh 1f\n\t" /* cc 1/3: jump to fallback path. */ \
81 /* tbegin returned _HTM_TBEGIN_TRANSIENT: retry with transaction. */ \
82 " crje %[R_TX_CNT], %[R_RETRY], 1f\n\t" /* Reached max retries? */ \
83 " ahi %[R_TX_CNT], 1\n\t" \
84 " ppa %[R_TX_CNT], 0, 1\n\t" /* Transaction-Abort Assist. */ \
85 " j 2b\n\t" /* Loop to tbegin. */
86
87/* Same as __libc_tbegin except if tbegin aborts with _HTM_TBEGIN_TRANSIENT.
88 Then this macros restores the fpc, fprs and automatically retries up to
89 retry_cnt tbegins. Further saving of the state is omitted as it is already
90 saved. This macro calls tbegin at most as retry_cnt + 1 times. */
91#define __libc_tbegin_retry(tdb, retry_cnt) \
92 ({ int __ret; \
93 int __tx_cnt = 0; \
94 __ret = __libc_tbegin_base(tdb, \
95 __libc_tbegin_retry_abort_path_insn, \
96 __libc_tbegin_retry_output_regs, \
97 __libc_tbegin_retry_input_regs(retry_cnt)); \
98 __ret; \
99 })
100
101#define __libc_tbegin_base(tdb, abort_path_insn, output_regs, input_regs) \
102 ({ int __ret; \
103 int __fpc; \
104 char __fprs[TX_FPRS_BYTES]; \
105 __asm__ __volatile__ (".machine push\n\t" \
106 ".machinemode \"zarch_nohighgprs\"\n\t" \
107 ".machine \"all\"\n\t" \
108 /* Save state at the outermost transaction. \
109 As extracting nesting depth is expensive \
110 on at least zEC12, save fprs at inner \
111 transactions, too. \
112 The fpc and fprs are saved here as they \
113 are not saved by tbegin. There exist no \
114 call-saved vrs, thus they are not saved \
115 here. */ \
116 " efpc %[R_FPC]\n\t" \
117 TX_SAVE_FPRS \
118 /* Begin transaction: save all gprs, allow \
119 ar modification and fp operations. Some \
120 program-interruptions (e.g. a null \
121 pointer access) are filtered and the \
122 transaction will abort. In this case \
123 the normal lock path will execute it \
124 again and result in a core dump wich does \
125 now show at tbegin but the real executed \
126 instruction. \
127 However it is not guaranteed that this \
128 retry operate on the same data and thus \
129 may not end in an program-interruption. \
130 Note: This could also be used to probe \
131 memory for being accessible! */ \
132 "2: tbegin 0, 0xFF0E\n\t" \
133 /* Branch away in abort case (this is the \
134 prefered sequence. See PoP in chapter 5 \
135 Transactional-Execution Facility \
136 Operation). */ \
137 " jnz 0f\n\t" \
138 /* Transaction has successfully started. */ \
139 " lhi %[R_RET], 0\n\t" \
140 " j 1f\n\t" \
141 /* Transaction has aborted. Now we are at \
142 the outermost transaction. Restore fprs \
143 and fpc. */ \
144 "0: ipm %[R_RET]\n\t" \
145 " srl %[R_RET], 28\n\t" \
146 " sfpc %[R_FPC]\n\t" \
147 TX_RESTORE_FPRS \
148 abort_path_insn \
149 "1:\n\t" \
150 ".machine pop\n" \
151 : [R_RET] "=&d" (__ret), \
152 [R_FPC] "=&d" (__fpc) \
153 output_regs \
154 : [R_FPRS] "a" (__fprs) \
155 input_regs \
156 : "cc", "memory"); \
157 __ret; \
158 })
159
160/* These builtins are usable in context of glibc lock elision code without any
161 changes. Use them. */
162#define __libc_tend() \
163 ({ __asm__ __volatile__ (".machine push\n\t" \
164 ".machinemode \"zarch_nohighgprs\"\n\t" \
165 ".machine \"all\"\n\t"); \
166 int __ret = __builtin_tend (); \
167 __asm__ __volatile__ (".machine pop"); \
168 __ret; \
169 })
170
171#define __libc_tabort(abortcode) \
172 __asm__ __volatile__ (".machine push\n\t" \
173 ".machinemode \"zarch_nohighgprs\"\n\t" \
174 ".machine \"all\"\n\t"); \
175 __builtin_tabort (abortcode); \
176 __asm__ __volatile__ (".machine pop")
177
178#define __libc_tx_nesting_depth() \
179 ({ __asm__ __volatile__ (".machine push\n\t" \
180 ".machinemode \"zarch_nohighgprs\"\n\t" \
181 ".machine \"all\"\n\t"); \
182 int __ret = __builtin_tx_nesting_depth (); \
183 __asm__ __volatile__ (".machine pop"); \
184 __ret; \
185 })
186
187#endif
188

source code of glibc/sysdeps/unix/sysv/linux/s390/htm.h