1 /* SPDX-License-Identifier: GPL-2.0-only */
2 /*
3 * Based on arch/arm/include/asm/io.h
4 *
5 * Copyright (C) 1996-2000 Russell King
6 * Copyright (C) 2012 ARM Ltd.
7 */
8 #ifndef __ASM_IO_H
9 #define __ASM_IO_H
10
11 #include <linux/types.h>
12 #include <linux/pgtable.h>
13
14 #include <asm/byteorder.h>
15 #include <asm/barrier.h>
16 #include <asm/memory.h>
17 #include <asm/early_ioremap.h>
18 #include <asm/alternative.h>
19 #include <asm/cpufeature.h>
20
21 /*
22 * Generic IO read/write. These perform native-endian accesses.
23 */
24 #define __raw_writeb __raw_writeb
__raw_writeb(u8 val,volatile void __iomem * addr)25 static __always_inline void __raw_writeb(u8 val, volatile void __iomem *addr)
26 {
27 volatile u8 __iomem *ptr = addr;
28 asm volatile("strb %w0, %1" : : "rZ" (val), "Qo" (*ptr));
29 }
30
31 #define __raw_writew __raw_writew
__raw_writew(u16 val,volatile void __iomem * addr)32 static __always_inline void __raw_writew(u16 val, volatile void __iomem *addr)
33 {
34 volatile u16 __iomem *ptr = addr;
35 asm volatile("strh %w0, %1" : : "rZ" (val), "Qo" (*ptr));
36 }
37
38 #define __raw_writel __raw_writel
__raw_writel(u32 val,volatile void __iomem * addr)39 static __always_inline void __raw_writel(u32 val, volatile void __iomem *addr)
40 {
41 volatile u32 __iomem *ptr = addr;
42 asm volatile("str %w0, %1" : : "rZ" (val), "Qo" (*ptr));
43 }
44
45 #define __raw_writeq __raw_writeq
__raw_writeq(u64 val,volatile void __iomem * addr)46 static __always_inline void __raw_writeq(u64 val, volatile void __iomem *addr)
47 {
48 volatile u64 __iomem *ptr = addr;
49 asm volatile("str %x0, %1" : : "rZ" (val), "Qo" (*ptr));
50 }
51
52 #define __raw_readb __raw_readb
__raw_readb(const volatile void __iomem * addr)53 static __always_inline u8 __raw_readb(const volatile void __iomem *addr)
54 {
55 u8 val;
56 asm volatile(ALTERNATIVE("ldrb %w0, [%1]",
57 "ldarb %w0, [%1]",
58 ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE)
59 : "=r" (val) : "r" (addr));
60 return val;
61 }
62
63 #define __raw_readw __raw_readw
__raw_readw(const volatile void __iomem * addr)64 static __always_inline u16 __raw_readw(const volatile void __iomem *addr)
65 {
66 u16 val;
67
68 asm volatile(ALTERNATIVE("ldrh %w0, [%1]",
69 "ldarh %w0, [%1]",
70 ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE)
71 : "=r" (val) : "r" (addr));
72 return val;
73 }
74
75 #define __raw_readl __raw_readl
__raw_readl(const volatile void __iomem * addr)76 static __always_inline u32 __raw_readl(const volatile void __iomem *addr)
77 {
78 u32 val;
79 asm volatile(ALTERNATIVE("ldr %w0, [%1]",
80 "ldar %w0, [%1]",
81 ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE)
82 : "=r" (val) : "r" (addr));
83 return val;
84 }
85
86 #define __raw_readq __raw_readq
__raw_readq(const volatile void __iomem * addr)87 static __always_inline u64 __raw_readq(const volatile void __iomem *addr)
88 {
89 u64 val;
90 asm volatile(ALTERNATIVE("ldr %0, [%1]",
91 "ldar %0, [%1]",
92 ARM64_WORKAROUND_DEVICE_LOAD_ACQUIRE)
93 : "=r" (val) : "r" (addr));
94 return val;
95 }
96
97 /* IO barriers */
98 #define __io_ar(v) \
99 ({ \
100 unsigned long tmp; \
101 \
102 dma_rmb(); \
103 \
104 /* \
105 * Create a dummy control dependency from the IO read to any \
106 * later instructions. This ensures that a subsequent call to \
107 * udelay() will be ordered due to the ISB in get_cycles(). \
108 */ \
109 asm volatile("eor %0, %1, %1\n" \
110 "cbnz %0, ." \
111 : "=r" (tmp) : "r" ((unsigned long)(v)) \
112 : "memory"); \
113 })
114
115 #define __io_bw() dma_wmb()
116 #define __io_br(v)
117 #define __io_aw(v)
118
119 /* arm64-specific, don't use in portable drivers */
120 #define __iormb(v) __io_ar(v)
121 #define __iowmb() __io_bw()
122 #define __iomb() dma_mb()
123
124 /*
125 * I/O port access primitives.
126 */
127 #define arch_has_dev_port() (1)
128 #define IO_SPACE_LIMIT (PCI_IO_SIZE - 1)
129 #define PCI_IOBASE ((void __iomem *)PCI_IO_START)
130
131 /*
132 * String version of I/O memory access operations.
133 */
134 extern void __memcpy_fromio(void *, const volatile void __iomem *, size_t);
135 extern void __memcpy_toio(volatile void __iomem *, const void *, size_t);
136 extern void __memset_io(volatile void __iomem *, int, size_t);
137
138 #define memset_io(c,v,l) __memset_io((c),(v),(l))
139 #define memcpy_fromio(a,c,l) __memcpy_fromio((a),(c),(l))
140 #define memcpy_toio(c,a,l) __memcpy_toio((c),(a),(l))
141
142 /*
143 * The ARM64 iowrite implementation is intended to support drivers that want to
144 * use write combining. For instance PCI drivers using write combining with a 64
145 * byte __iowrite64_copy() expect to get a 64 byte MemWr TLP on the PCIe bus.
146 *
147 * Newer ARM core have sensitive write combining buffers, it is important that
148 * the stores be contiguous blocks of store instructions. Normal memcpy
149 * approaches have a very low chance to generate write combining.
150 *
151 * Since this is the only API on ARM64 that should be used with write combining
152 * it also integrates the DGH hint which is supposed to lower the latency to
153 * emit the large TLP from the CPU.
154 */
155
156 static __always_inline void
__const_memcpy_toio_aligned32(volatile u32 __iomem * to,const u32 * from,size_t count)157 __const_memcpy_toio_aligned32(volatile u32 __iomem *to, const u32 *from,
158 size_t count)
159 {
160 switch (count) {
161 case 8:
162 asm volatile("str %w0, [%8, #4 * 0]\n"
163 "str %w1, [%8, #4 * 1]\n"
164 "str %w2, [%8, #4 * 2]\n"
165 "str %w3, [%8, #4 * 3]\n"
166 "str %w4, [%8, #4 * 4]\n"
167 "str %w5, [%8, #4 * 5]\n"
168 "str %w6, [%8, #4 * 6]\n"
169 "str %w7, [%8, #4 * 7]\n"
170 :
171 : "rZ"(from[0]), "rZ"(from[1]), "rZ"(from[2]),
172 "rZ"(from[3]), "rZ"(from[4]), "rZ"(from[5]),
173 "rZ"(from[6]), "rZ"(from[7]), "r"(to));
174 break;
175 case 4:
176 asm volatile("str %w0, [%4, #4 * 0]\n"
177 "str %w1, [%4, #4 * 1]\n"
178 "str %w2, [%4, #4 * 2]\n"
179 "str %w3, [%4, #4 * 3]\n"
180 :
181 : "rZ"(from[0]), "rZ"(from[1]), "rZ"(from[2]),
182 "rZ"(from[3]), "r"(to));
183 break;
184 case 2:
185 asm volatile("str %w0, [%2, #4 * 0]\n"
186 "str %w1, [%2, #4 * 1]\n"
187 :
188 : "rZ"(from[0]), "rZ"(from[1]), "r"(to));
189 break;
190 case 1:
191 __raw_writel(*from, to);
192 break;
193 default:
194 BUILD_BUG();
195 }
196 }
197
198 void __iowrite32_copy_full(void __iomem *to, const void *from, size_t count);
199
200 static __always_inline void
__iowrite32_copy(void __iomem * to,const void * from,size_t count)201 __iowrite32_copy(void __iomem *to, const void *from, size_t count)
202 {
203 if (__builtin_constant_p(count) &&
204 (count == 8 || count == 4 || count == 2 || count == 1)) {
205 __const_memcpy_toio_aligned32(to, from, count);
206 dgh();
207 } else {
208 __iowrite32_copy_full(to, from, count);
209 }
210 }
211 #define __iowrite32_copy __iowrite32_copy
212
213 static __always_inline void
__const_memcpy_toio_aligned64(volatile u64 __iomem * to,const u64 * from,size_t count)214 __const_memcpy_toio_aligned64(volatile u64 __iomem *to, const u64 *from,
215 size_t count)
216 {
217 switch (count) {
218 case 8:
219 asm volatile("str %x0, [%8, #8 * 0]\n"
220 "str %x1, [%8, #8 * 1]\n"
221 "str %x2, [%8, #8 * 2]\n"
222 "str %x3, [%8, #8 * 3]\n"
223 "str %x4, [%8, #8 * 4]\n"
224 "str %x5, [%8, #8 * 5]\n"
225 "str %x6, [%8, #8 * 6]\n"
226 "str %x7, [%8, #8 * 7]\n"
227 :
228 : "rZ"(from[0]), "rZ"(from[1]), "rZ"(from[2]),
229 "rZ"(from[3]), "rZ"(from[4]), "rZ"(from[5]),
230 "rZ"(from[6]), "rZ"(from[7]), "r"(to));
231 break;
232 case 4:
233 asm volatile("str %x0, [%4, #8 * 0]\n"
234 "str %x1, [%4, #8 * 1]\n"
235 "str %x2, [%4, #8 * 2]\n"
236 "str %x3, [%4, #8 * 3]\n"
237 :
238 : "rZ"(from[0]), "rZ"(from[1]), "rZ"(from[2]),
239 "rZ"(from[3]), "r"(to));
240 break;
241 case 2:
242 asm volatile("str %x0, [%2, #8 * 0]\n"
243 "str %x1, [%2, #8 * 1]\n"
244 :
245 : "rZ"(from[0]), "rZ"(from[1]), "r"(to));
246 break;
247 case 1:
248 __raw_writeq(*from, to);
249 break;
250 default:
251 BUILD_BUG();
252 }
253 }
254
255 void __iowrite64_copy_full(void __iomem *to, const void *from, size_t count);
256
257 static __always_inline void
__iowrite64_copy(void __iomem * to,const void * from,size_t count)258 __iowrite64_copy(void __iomem *to, const void *from, size_t count)
259 {
260 if (__builtin_constant_p(count) &&
261 (count == 8 || count == 4 || count == 2 || count == 1)) {
262 __const_memcpy_toio_aligned64(to, from, count);
263 dgh();
264 } else {
265 __iowrite64_copy_full(to, from, count);
266 }
267 }
268 #define __iowrite64_copy __iowrite64_copy
269
270 /*
271 * I/O memory mapping functions.
272 */
273
274 typedef int (*ioremap_prot_hook_t)(phys_addr_t phys_addr, size_t size,
275 pgprot_t *prot);
276 int arm64_ioremap_prot_hook_register(const ioremap_prot_hook_t hook);
277
278 #define ioremap_prot ioremap_prot
279
280 #define _PAGE_IOREMAP PROT_DEVICE_nGnRE
281
282 #define ioremap_wc(addr, size) \
283 ioremap_prot((addr), (size), PROT_NORMAL_NC)
284 #define ioremap_np(addr, size) \
285 ioremap_prot((addr), (size), PROT_DEVICE_nGnRnE)
286
287 /*
288 * io{read,write}{16,32,64}be() macros
289 */
290 #define ioread16be(p) ({ __u16 __v = be16_to_cpu((__force __be16)__raw_readw(p)); __iormb(__v); __v; })
291 #define ioread32be(p) ({ __u32 __v = be32_to_cpu((__force __be32)__raw_readl(p)); __iormb(__v); __v; })
292 #define ioread64be(p) ({ __u64 __v = be64_to_cpu((__force __be64)__raw_readq(p)); __iormb(__v); __v; })
293
294 #define iowrite16be(v,p) ({ __iowmb(); __raw_writew((__force __u16)cpu_to_be16(v), p); })
295 #define iowrite32be(v,p) ({ __iowmb(); __raw_writel((__force __u32)cpu_to_be32(v), p); })
296 #define iowrite64be(v,p) ({ __iowmb(); __raw_writeq((__force __u64)cpu_to_be64(v), p); })
297
298 #include <asm-generic/io.h>
299
300 #define ioremap_cache ioremap_cache
ioremap_cache(phys_addr_t addr,size_t size)301 static inline void __iomem *ioremap_cache(phys_addr_t addr, size_t size)
302 {
303 if (pfn_is_map_memory(__phys_to_pfn(addr)))
304 return (void __iomem *)__phys_to_virt(addr);
305
306 return ioremap_prot(addr, size, PROT_NORMAL);
307 }
308
309 /*
310 * More restrictive address range checking than the default implementation
311 * (PHYS_OFFSET and PHYS_MASK taken into account).
312 */
313 #define ARCH_HAS_VALID_PHYS_ADDR_RANGE
314 extern int valid_phys_addr_range(phys_addr_t addr, size_t size);
315 extern int valid_mmap_phys_addr_range(unsigned long pfn, size_t size);
316
317 extern bool arch_memremap_can_ram_remap(resource_size_t offset, size_t size,
318 unsigned long flags);
319 #define arch_memremap_can_ram_remap arch_memremap_can_ram_remap
320
321 #endif /* __ASM_IO_H */
322