io.h 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336
  1. /* SPDX-License-Identifier: GPL-2.0-only */
  2. /*
  3. * Based on arch/arm/include/asm/io.h
  4. *
  5. * Copyright (C) 1996-2000 Russell King
  6. * Copyright (C) 2012 ARM Ltd.
  7. */
  8. #ifndef __ASM_IO_H
  9. #define __ASM_IO_H
  10. #include <linux/types.h>
  11. #include <linux/pgtable.h>
  12. #include <asm/byteorder.h>
  13. #include <asm/barrier.h>
  14. #include <asm/memory.h>
  15. #include <asm/early_ioremap.h>
  16. #include <asm/alternative.h>
  17. #include <asm/cpufeature.h>
  18. #include <asm/rsi.h>
  19. /*
  20. * Generic IO read/write. These perform native-endian accesses.
  21. */
  22. #define __raw_writeb __raw_writeb
  23. static __always_inline void __raw_writeb(u8 val, volatile void __iomem *addr)
  24. {
  25. volatile u8 __iomem *ptr = addr;
  26. asm volatile("strb %w0, %1" : : "rZ" (val), "Qo" (*ptr));
  27. }
  28. #define __raw_writew __raw_writew
  29. static __always_inline void __raw_writew(u16 val, volatile void __iomem *addr)
  30. {
  31. volatile u16 __iomem *ptr = addr;
  32. asm volatile("strh %w0, %1" : : "rZ" (val), "Qo" (*ptr));
  33. }
  34. #define __raw_writel __raw_writel
  35. static __always_inline void __raw_writel(u32 val, volatile void __iomem *addr)
  36. {
  37. volatile u32 __iomem *ptr = addr;
  38. asm volatile("str %w0, %1" : : "rZ" (val), "Qo" (*ptr));
  39. }
  40. #define __raw_writeq __raw_writeq
  41. static __always_inline void __raw_writeq(u64 val, volatile void __iomem *addr)
  42. {
  43. volatile u64 __iomem *ptr = addr;
  44. asm volatile("str %x0, %1" : : "rZ" (val), "Qo" (*ptr));
  45. }
  46. #define __raw_readb __raw_readb
  47. static __always_inline u8 __raw_readb(const volatile void __iomem *addr)
  48. {
  49. u8 val;
  50. asm volatile(ALTERNATIVE("ldrb %w0, [%1]",
  51. "ldarb %w0, [%1]",
  52. ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE)
  53. : "=r" (val) : "r" (addr));
  54. return val;
  55. }
  56. #define __raw_readw __raw_readw
  57. static __always_inline u16 __raw_readw(const volatile void __iomem *addr)
  58. {
  59. u16 val;
  60. asm volatile(ALTERNATIVE("ldrh %w0, [%1]",
  61. "ldarh %w0, [%1]",
  62. ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE)
  63. : "=r" (val) : "r" (addr));
  64. return val;
  65. }
  66. #define __raw_readl __raw_readl
  67. static __always_inline u32 __raw_readl(const volatile void __iomem *addr)
  68. {
  69. u32 val;
  70. asm volatile(ALTERNATIVE("ldr %w0, [%1]",
  71. "ldar %w0, [%1]",
  72. ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE)
  73. : "=r" (val) : "r" (addr));
  74. return val;
  75. }
  76. #define __raw_readq __raw_readq
  77. static __always_inline u64 __raw_readq(const volatile void __iomem *addr)
  78. {
  79. u64 val;
  80. asm volatile(ALTERNATIVE("ldr %0, [%1]",
  81. "ldar %0, [%1]",
  82. ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE)
  83. : "=r" (val) : "r" (addr));
  84. return val;
  85. }
  86. /* IO barriers */
  87. #define __io_ar(v) \
  88. ({ \
  89. unsigned long tmp; \
  90. \
  91. dma_rmb(); \
  92. \
  93. /* \
  94. * Create a dummy control dependency from the IO read to any \
  95. * later instructions. This ensures that a subsequent call to \
  96. * udelay() will be ordered due to the ISB in get_cycles(). \
  97. */ \
  98. asm volatile("eor %0, %1, %1\n" \
  99. "cbnz %0, ." \
  100. : "=r" (tmp) : "r" ((unsigned long)(v)) \
  101. : "memory"); \
  102. })
  103. #define __io_bw() dma_wmb()
  104. #define __io_br(v)
  105. #define __io_aw(v)
  106. /* arm64-specific, don't use in portable drivers */
  107. #define __iormb(v) __io_ar(v)
  108. #define __iowmb() __io_bw()
  109. #define __iomb() dma_mb()
  110. /*
  111. * I/O port access primitives.
  112. */
  113. #define arch_has_dev_port() (1)
  114. #define IO_SPACE_LIMIT (PCI_IO_SIZE - 1)
  115. #define PCI_IOBASE ((void __iomem *)PCI_IO_START)
  116. /*
  117. * The ARM64 iowrite implementation is intended to support drivers that want to
  118. * use write combining. For instance PCI drivers using write combining with a 64
  119. * byte __iowrite64_copy() expect to get a 64 byte MemWr TLP on the PCIe bus.
  120. *
  121. * Newer ARM core have sensitive write combining buffers, it is important that
  122. * the stores be contiguous blocks of store instructions. Normal memcpy
  123. * approaches have a very low chance to generate write combining.
  124. *
  125. * Since this is the only API on ARM64 that should be used with write combining
  126. * it also integrates the DGH hint which is supposed to lower the latency to
  127. * emit the large TLP from the CPU.
  128. */
  129. static __always_inline void
  130. __const_memcpy_toio_aligned32(volatile u32 __iomem *to, const u32 *from,
  131. size_t count)
  132. {
  133. switch (count) {
  134. case 8:
  135. asm volatile("str %w0, [%8, #4 * 0]\n"
  136. "str %w1, [%8, #4 * 1]\n"
  137. "str %w2, [%8, #4 * 2]\n"
  138. "str %w3, [%8, #4 * 3]\n"
  139. "str %w4, [%8, #4 * 4]\n"
  140. "str %w5, [%8, #4 * 5]\n"
  141. "str %w6, [%8, #4 * 6]\n"
  142. "str %w7, [%8, #4 * 7]\n"
  143. :
  144. : "rZ"(from[0]), "rZ"(from[1]), "rZ"(from[2]),
  145. "rZ"(from[3]), "rZ"(from[4]), "rZ"(from[5]),
  146. "rZ"(from[6]), "rZ"(from[7]), "r"(to));
  147. break;
  148. case 4:
  149. asm volatile("str %w0, [%4, #4 * 0]\n"
  150. "str %w1, [%4, #4 * 1]\n"
  151. "str %w2, [%4, #4 * 2]\n"
  152. "str %w3, [%4, #4 * 3]\n"
  153. :
  154. : "rZ"(from[0]), "rZ"(from[1]), "rZ"(from[2]),
  155. "rZ"(from[3]), "r"(to));
  156. break;
  157. case 2:
  158. asm volatile("str %w0, [%2, #4 * 0]\n"
  159. "str %w1, [%2, #4 * 1]\n"
  160. :
  161. : "rZ"(from[0]), "rZ"(from[1]), "r"(to));
  162. break;
  163. case 1:
  164. __raw_writel(*from, to);
  165. break;
  166. default:
  167. BUILD_BUG();
  168. }
  169. }
  170. void __iowrite32_copy_full(void __iomem *to, const void *from, size_t count);
  171. static __always_inline void
  172. __iowrite32_copy(void __iomem *to, const void *from, size_t count)
  173. {
  174. if (__builtin_constant_p(count) &&
  175. (count == 8 || count == 4 || count == 2 || count == 1)) {
  176. __const_memcpy_toio_aligned32(to, from, count);
  177. dgh();
  178. } else {
  179. __iowrite32_copy_full(to, from, count);
  180. }
  181. }
  182. #define __iowrite32_copy __iowrite32_copy
  183. static __always_inline void
  184. __const_memcpy_toio_aligned64(volatile u64 __iomem *to, const u64 *from,
  185. size_t count)
  186. {
  187. switch (count) {
  188. case 8:
  189. asm volatile("str %x0, [%8, #8 * 0]\n"
  190. "str %x1, [%8, #8 * 1]\n"
  191. "str %x2, [%8, #8 * 2]\n"
  192. "str %x3, [%8, #8 * 3]\n"
  193. "str %x4, [%8, #8 * 4]\n"
  194. "str %x5, [%8, #8 * 5]\n"
  195. "str %x6, [%8, #8 * 6]\n"
  196. "str %x7, [%8, #8 * 7]\n"
  197. :
  198. : "rZ"(from[0]), "rZ"(from[1]), "rZ"(from[2]),
  199. "rZ"(from[3]), "rZ"(from[4]), "rZ"(from[5]),
  200. "rZ"(from[6]), "rZ"(from[7]), "r"(to));
  201. break;
  202. case 4:
  203. asm volatile("str %x0, [%4, #8 * 0]\n"
  204. "str %x1, [%4, #8 * 1]\n"
  205. "str %x2, [%4, #8 * 2]\n"
  206. "str %x3, [%4, #8 * 3]\n"
  207. :
  208. : "rZ"(from[0]), "rZ"(from[1]), "rZ"(from[2]),
  209. "rZ"(from[3]), "r"(to));
  210. break;
  211. case 2:
  212. asm volatile("str %x0, [%2, #8 * 0]\n"
  213. "str %x1, [%2, #8 * 1]\n"
  214. :
  215. : "rZ"(from[0]), "rZ"(from[1]), "r"(to));
  216. break;
  217. case 1:
  218. __raw_writeq(*from, to);
  219. break;
  220. default:
  221. BUILD_BUG();
  222. }
  223. }
  224. void __iowrite64_copy_full(void __iomem *to, const void *from, size_t count);
  225. static __always_inline void
  226. __iowrite64_copy(void __iomem *to, const void *from, size_t count)
  227. {
  228. if (__builtin_constant_p(count) &&
  229. (count == 8 || count == 4 || count == 2 || count == 1)) {
  230. __const_memcpy_toio_aligned64(to, from, count);
  231. dgh();
  232. } else {
  233. __iowrite64_copy_full(to, from, count);
  234. }
  235. }
  236. #define __iowrite64_copy __iowrite64_copy
  237. /*
  238. * I/O memory mapping functions.
  239. */
  240. typedef int (*ioremap_prot_hook_t)(phys_addr_t phys_addr, size_t size,
  241. pgprot_t *prot);
  242. int arm64_ioremap_prot_hook_register(const ioremap_prot_hook_t hook);
  243. void __iomem *__ioremap_prot(phys_addr_t phys, size_t size, pgprot_t prot);
  244. static inline void __iomem *ioremap_prot(phys_addr_t phys, size_t size,
  245. pgprot_t user_prot)
  246. {
  247. pgprot_t prot;
  248. ptdesc_t user_prot_val = pgprot_val(user_prot);
  249. if (WARN_ON_ONCE(!(user_prot_val & PTE_USER)))
  250. return NULL;
  251. prot = __pgprot_modify(PAGE_KERNEL, PTE_ATTRINDX_MASK,
  252. user_prot_val & PTE_ATTRINDX_MASK);
  253. return __ioremap_prot(phys, size, prot);
  254. }
  255. #define ioremap_prot ioremap_prot
  256. #define ioremap(addr, size) \
  257. __ioremap_prot((addr), (size), __pgprot(PROT_DEVICE_nGnRE))
  258. #define ioremap_wc(addr, size) \
  259. __ioremap_prot((addr), (size), __pgprot(PROT_NORMAL_NC))
  260. #define ioremap_np(addr, size) \
  261. __ioremap_prot((addr), (size), __pgprot(PROT_DEVICE_nGnRnE))
  262. #define ioremap_encrypted(addr, size) \
  263. __ioremap_prot((addr), (size), PAGE_KERNEL)
  264. /*
  265. * io{read,write}{16,32,64}be() macros
  266. */
  267. #define ioread16be(p) ({ __u16 __v = be16_to_cpu((__force __be16)__raw_readw(p)); __iormb(__v); __v; })
  268. #define ioread32be(p) ({ __u32 __v = be32_to_cpu((__force __be32)__raw_readl(p)); __iormb(__v); __v; })
  269. #define ioread64be(p) ({ __u64 __v = be64_to_cpu((__force __be64)__raw_readq(p)); __iormb(__v); __v; })
  270. #define iowrite16be(v,p) ({ __iowmb(); __raw_writew((__force __u16)cpu_to_be16(v), p); })
  271. #define iowrite32be(v,p) ({ __iowmb(); __raw_writel((__force __u32)cpu_to_be32(v), p); })
  272. #define iowrite64be(v,p) ({ __iowmb(); __raw_writeq((__force __u64)cpu_to_be64(v), p); })
  273. #include <asm-generic/io.h>
  274. #define ioremap_cache ioremap_cache
  275. static inline void __iomem *ioremap_cache(phys_addr_t addr, size_t size)
  276. {
  277. if (pfn_is_map_memory(__phys_to_pfn(addr)))
  278. return (void __iomem *)__phys_to_virt(addr);
  279. return __ioremap_prot(addr, size, __pgprot(PROT_NORMAL));
  280. }
  281. /*
  282. * More restrictive address range checking than the default implementation
  283. * (PHYS_OFFSET and PHYS_MASK taken into account).
  284. */
  285. #define ARCH_HAS_VALID_PHYS_ADDR_RANGE
  286. extern int valid_phys_addr_range(phys_addr_t addr, size_t size);
  287. extern int valid_mmap_phys_addr_range(unsigned long pfn, size_t size);
  288. extern bool arch_memremap_can_ram_remap(resource_size_t offset, size_t size,
  289. unsigned long flags);
  290. #define arch_memremap_can_ram_remap arch_memremap_can_ram_remap
  291. static inline bool arm64_is_protected_mmio(phys_addr_t phys_addr, size_t size)
  292. {
  293. if (unlikely(is_realm_world()))
  294. return arm64_rsi_is_protected(phys_addr, size);
  295. return false;
  296. }
  297. #endif /* __ASM_IO_H */