rseq-ppc.h 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238
  1. /* SPDX-License-Identifier: LGPL-2.1 OR MIT */
  2. /*
  3. * rseq-ppc.h
  4. *
  5. * (C) Copyright 2016-2022 - Mathieu Desnoyers <mathieu.desnoyers@efficios.com>
  6. * (C) Copyright 2016-2018 - Boqun Feng <boqun.feng@gmail.com>
  7. */
  8. /*
  9. * RSEQ_SIG is used with the following trap instruction:
  10. *
  11. * powerpc-be: 0f e5 00 0b twui r5,11
  12. * powerpc64-le: 0b 00 e5 0f twui r5,11
  13. * powerpc64-be: 0f e5 00 0b twui r5,11
  14. */
  15. #define RSEQ_SIG 0x0fe5000b
  16. #define rseq_smp_mb() __asm__ __volatile__ ("sync" ::: "memory", "cc")
  17. #define rseq_smp_lwsync() __asm__ __volatile__ ("lwsync" ::: "memory", "cc")
  18. #define rseq_smp_rmb() rseq_smp_lwsync()
  19. #define rseq_smp_wmb() rseq_smp_lwsync()
  20. #define rseq_smp_load_acquire(p) \
  21. __extension__ ({ \
  22. rseq_unqual_scalar_typeof(*(p)) ____p1 = RSEQ_READ_ONCE(*(p)); \
  23. rseq_smp_lwsync(); \
  24. ____p1; \
  25. })
  26. #define rseq_smp_acquire__after_ctrl_dep() rseq_smp_lwsync()
  27. #define rseq_smp_store_release(p, v) \
  28. do { \
  29. rseq_smp_lwsync(); \
  30. RSEQ_WRITE_ONCE(*(p), v); \
  31. } while (0)
  32. /*
  33. * The __rseq_cs_ptr_array and __rseq_cs sections can be used by debuggers to
  34. * better handle single-stepping through the restartable critical sections.
  35. */
  36. #ifdef __PPC64__
  37. #define RSEQ_STORE_LONG(arg) "std%U[" __rseq_str(arg) "]%X[" __rseq_str(arg) "] " /* To memory ("m" constraint) */
  38. #define RSEQ_STORE_INT(arg) "stw%U[" __rseq_str(arg) "]%X[" __rseq_str(arg) "] " /* To memory ("m" constraint) */
  39. #define RSEQ_LOAD_LONG(arg) "ld%U[" __rseq_str(arg) "]%X[" __rseq_str(arg) "] " /* From memory ("m" constraint) */
  40. #define RSEQ_LOAD_INT(arg) "lwz%U[" __rseq_str(arg) "]%X[" __rseq_str(arg) "] " /* From memory ("m" constraint) */
  41. #define RSEQ_LOADX_LONG "ldx " /* From base register ("b" constraint) */
  42. #define RSEQ_CMP_LONG "cmpd "
  43. #define RSEQ_CMP_LONG_INT "cmpdi "
  44. #define __RSEQ_ASM_DEFINE_TABLE(label, version, flags, \
  45. start_ip, post_commit_offset, abort_ip) \
  46. ".pushsection __rseq_cs, \"aw\"\n\t" \
  47. ".balign 32\n\t" \
  48. __rseq_str(label) ":\n\t" \
  49. ".long " __rseq_str(version) ", " __rseq_str(flags) "\n\t" \
  50. ".quad " __rseq_str(start_ip) ", " __rseq_str(post_commit_offset) ", " __rseq_str(abort_ip) "\n\t" \
  51. ".popsection\n\t" \
  52. ".pushsection __rseq_cs_ptr_array, \"aw\"\n\t" \
  53. ".quad " __rseq_str(label) "b\n\t" \
  54. ".popsection\n\t"
  55. #define RSEQ_ASM_STORE_RSEQ_CS(label, cs_label, rseq_cs) \
  56. RSEQ_INJECT_ASM(1) \
  57. "lis %%r17, (" __rseq_str(cs_label) ")@highest\n\t" \
  58. "ori %%r17, %%r17, (" __rseq_str(cs_label) ")@higher\n\t" \
  59. "rldicr %%r17, %%r17, 32, 31\n\t" \
  60. "oris %%r17, %%r17, (" __rseq_str(cs_label) ")@high\n\t" \
  61. "ori %%r17, %%r17, (" __rseq_str(cs_label) ")@l\n\t" \
  62. "std %%r17, %[" __rseq_str(rseq_cs) "]\n\t" \
  63. __rseq_str(label) ":\n\t"
  64. /*
  65. * Exit points of a rseq critical section consist of all instructions outside
  66. * of the critical section where a critical section can either branch to or
  67. * reach through the normal course of its execution. The abort IP and the
  68. * post-commit IP are already part of the __rseq_cs section and should not be
  69. * explicitly defined as additional exit points. Knowing all exit points is
  70. * useful to assist debuggers stepping over the critical section.
  71. */
  72. #define RSEQ_ASM_DEFINE_EXIT_POINT(start_ip, exit_ip) \
  73. ".pushsection __rseq_exit_point_array, \"aw\"\n\t" \
  74. ".quad " __rseq_str(start_ip) ", " __rseq_str(exit_ip) "\n\t" \
  75. ".popsection\n\t"
  76. #else /* #ifdef __PPC64__ */
  77. #define RSEQ_STORE_LONG(arg) "stw%U[" __rseq_str(arg) "]%X[" __rseq_str(arg) "] " /* To memory ("m" constraint) */
  78. #define RSEQ_STORE_INT(arg) RSEQ_STORE_LONG(arg) /* To memory ("m" constraint) */
  79. #define RSEQ_LOAD_LONG(arg) "lwz%U[" __rseq_str(arg) "]%X[" __rseq_str(arg) "] " /* From memory ("m" constraint) */
  80. #define RSEQ_LOAD_INT(arg) RSEQ_LOAD_LONG(arg) /* From memory ("m" constraint) */
  81. #define RSEQ_LOADX_LONG "lwzx " /* From base register ("b" constraint) */
  82. #define RSEQ_CMP_LONG "cmpw "
  83. #define RSEQ_CMP_LONG_INT "cmpwi "
  84. #define __RSEQ_ASM_DEFINE_TABLE(label, version, flags, \
  85. start_ip, post_commit_offset, abort_ip) \
  86. ".pushsection __rseq_cs, \"aw\"\n\t" \
  87. ".balign 32\n\t" \
  88. __rseq_str(label) ":\n\t" \
  89. ".long " __rseq_str(version) ", " __rseq_str(flags) "\n\t" \
  90. /* 32-bit only supported on BE */ \
  91. ".long 0x0, " __rseq_str(start_ip) ", 0x0, " __rseq_str(post_commit_offset) ", 0x0, " __rseq_str(abort_ip) "\n\t" \
  92. ".popsection\n\t" \
  93. ".pushsection __rseq_cs_ptr_array, \"aw\"\n\t" \
  94. ".long 0x0, " __rseq_str(label) "b\n\t" \
  95. ".popsection\n\t"
  96. /*
  97. * Exit points of a rseq critical section consist of all instructions outside
  98. * of the critical section where a critical section can either branch to or
  99. * reach through the normal course of its execution. The abort IP and the
  100. * post-commit IP are already part of the __rseq_cs section and should not be
  101. * explicitly defined as additional exit points. Knowing all exit points is
  102. * useful to assist debuggers stepping over the critical section.
  103. */
  104. #define RSEQ_ASM_DEFINE_EXIT_POINT(start_ip, exit_ip) \
  105. ".pushsection __rseq_exit_point_array, \"aw\"\n\t" \
  106. /* 32-bit only supported on BE */ \
  107. ".long 0x0, " __rseq_str(start_ip) ", 0x0, " __rseq_str(exit_ip) "\n\t" \
  108. ".popsection\n\t"
  109. #define RSEQ_ASM_STORE_RSEQ_CS(label, cs_label, rseq_cs) \
  110. RSEQ_INJECT_ASM(1) \
  111. "lis %%r17, (" __rseq_str(cs_label) ")@ha\n\t" \
  112. "addi %%r17, %%r17, (" __rseq_str(cs_label) ")@l\n\t" \
  113. RSEQ_STORE_INT(rseq_cs) "%%r17, %[" __rseq_str(rseq_cs) "]\n\t" \
  114. __rseq_str(label) ":\n\t"
  115. #endif /* #ifdef __PPC64__ */
  116. #define RSEQ_ASM_DEFINE_TABLE(label, start_ip, post_commit_ip, abort_ip) \
  117. __RSEQ_ASM_DEFINE_TABLE(label, 0x0, 0x0, start_ip, \
  118. (post_commit_ip - start_ip), abort_ip)
  119. #define RSEQ_ASM_CMP_CPU_ID(cpu_id, current_cpu_id, label) \
  120. RSEQ_INJECT_ASM(2) \
  121. RSEQ_LOAD_INT(current_cpu_id) "%%r17, %[" __rseq_str(current_cpu_id) "]\n\t" \
  122. "cmpw cr7, %[" __rseq_str(cpu_id) "], %%r17\n\t" \
  123. "bne- cr7, " __rseq_str(label) "\n\t"
  124. #define RSEQ_ASM_DEFINE_ABORT(label, abort_label) \
  125. ".pushsection __rseq_failure, \"ax\"\n\t" \
  126. ".long " __rseq_str(RSEQ_SIG) "\n\t" \
  127. __rseq_str(label) ":\n\t" \
  128. "b %l[" __rseq_str(abort_label) "]\n\t" \
  129. ".popsection\n\t"
  130. /*
  131. * RSEQ_ASM_OPs: asm operations for rseq
  132. * RSEQ_ASM_OP_R_*: has hard-code registers in it
  133. * RSEQ_ASM_OP_* (else): doesn't have hard-code registers(unless cr7)
  134. */
  135. #define RSEQ_ASM_OP_CMPEQ(var, expect, label) \
  136. RSEQ_LOAD_LONG(var) "%%r17, %[" __rseq_str(var) "]\n\t" \
  137. RSEQ_CMP_LONG "cr7, %%r17, %[" __rseq_str(expect) "]\n\t" \
  138. "bne- cr7, " __rseq_str(label) "\n\t"
  139. #define RSEQ_ASM_OP_CMPNE(var, expectnot, label) \
  140. RSEQ_LOAD_LONG(var) "%%r17, %[" __rseq_str(var) "]\n\t" \
  141. RSEQ_CMP_LONG "cr7, %%r17, %[" __rseq_str(expectnot) "]\n\t" \
  142. "beq- cr7, " __rseq_str(label) "\n\t"
  143. #define RSEQ_ASM_OP_STORE(value, var) \
  144. RSEQ_STORE_LONG(var) "%[" __rseq_str(value) "], %[" __rseq_str(var) "]\n\t"
  145. /* Load @var to r17 */
  146. #define RSEQ_ASM_OP_R_LOAD(var) \
  147. RSEQ_LOAD_LONG(var) "%%r17, %[" __rseq_str(var) "]\n\t"
  148. /* Store r17 to @var */
  149. #define RSEQ_ASM_OP_R_STORE(var) \
  150. RSEQ_STORE_LONG(var) "%%r17, %[" __rseq_str(var) "]\n\t"
  151. /* Add @count to r17 */
  152. #define RSEQ_ASM_OP_R_ADD(count) \
  153. "add %%r17, %[" __rseq_str(count) "], %%r17\n\t"
  154. /* Load (r17 + voffp) to r17 */
  155. #define RSEQ_ASM_OP_R_LOADX(voffp) \
  156. RSEQ_LOADX_LONG "%%r17, %[" __rseq_str(voffp) "], %%r17\n\t"
  157. /* TODO: implement a faster memcpy. */
  158. #define RSEQ_ASM_OP_R_MEMCPY() \
  159. RSEQ_CMP_LONG_INT "%%r19, 0\n\t" \
  160. "beq 333f\n\t" \
  161. "addi %%r20, %%r20, -1\n\t" \
  162. "addi %%r21, %%r21, -1\n\t" \
  163. "222:\n\t" \
  164. "lbzu %%r18, 1(%%r20)\n\t" \
  165. "stbu %%r18, 1(%%r21)\n\t" \
  166. "addi %%r19, %%r19, -1\n\t" \
  167. RSEQ_CMP_LONG_INT "%%r19, 0\n\t" \
  168. "bne 222b\n\t" \
  169. "333:\n\t" \
  170. #define RSEQ_ASM_OP_R_FINAL_STORE(var, post_commit_label) \
  171. RSEQ_STORE_LONG(var) "%%r17, %[" __rseq_str(var) "]\n\t" \
  172. __rseq_str(post_commit_label) ":\n\t"
  173. #define RSEQ_ASM_OP_FINAL_STORE(value, var, post_commit_label) \
  174. RSEQ_STORE_LONG(var) "%[" __rseq_str(value) "], %[" __rseq_str(var) "]\n\t" \
  175. __rseq_str(post_commit_label) ":\n\t"
  176. /* Per-cpu-id indexing. */
  177. #define RSEQ_TEMPLATE_CPU_ID
  178. #define RSEQ_TEMPLATE_MO_RELAXED
  179. #include "rseq-ppc-bits.h"
  180. #undef RSEQ_TEMPLATE_MO_RELAXED
  181. #define RSEQ_TEMPLATE_MO_RELEASE
  182. #include "rseq-ppc-bits.h"
  183. #undef RSEQ_TEMPLATE_MO_RELEASE
  184. #undef RSEQ_TEMPLATE_CPU_ID
  185. /* Per-mm-cid indexing. */
  186. #define RSEQ_TEMPLATE_MM_CID
  187. #define RSEQ_TEMPLATE_MO_RELAXED
  188. #include "rseq-ppc-bits.h"
  189. #undef RSEQ_TEMPLATE_MO_RELAXED
  190. #define RSEQ_TEMPLATE_MO_RELEASE
  191. #include "rseq-ppc-bits.h"
  192. #undef RSEQ_TEMPLATE_MO_RELEASE
  193. #undef RSEQ_TEMPLATE_MM_CID
  194. /* APIs which are not based on cpu ids. */
  195. #define RSEQ_TEMPLATE_CPU_ID_NONE
  196. #define RSEQ_TEMPLATE_MO_RELAXED
  197. #include "rseq-ppc-bits.h"
  198. #undef RSEQ_TEMPLATE_MO_RELAXED
  199. #undef RSEQ_TEMPLATE_CPU_ID_NONE