xref: /linux/drivers/accel/habanalabs/common/hldio.h (revision 58809f614e0e3f4e12b489bddf680bfeb31c0a20)
1*8cbacc9aSKonstantin Sinyuk /* SPDX-License-Identifier: GPL-2.0-only */
2*8cbacc9aSKonstantin Sinyuk /*
3*8cbacc9aSKonstantin Sinyuk  * hldio.h - NVMe Direct I/O (HLDIO) infrastructure for Habana Labs Driver
4*8cbacc9aSKonstantin Sinyuk  *
5*8cbacc9aSKonstantin Sinyuk  * This feature requires specific hardware setup and must not be built
6*8cbacc9aSKonstantin Sinyuk  * under COMPILE_TEST.
7*8cbacc9aSKonstantin Sinyuk  */
8*8cbacc9aSKonstantin Sinyuk 
9*8cbacc9aSKonstantin Sinyuk #ifndef __HL_HLDIO_H__
10*8cbacc9aSKonstantin Sinyuk #define __HL_HLDIO_H__
11*8cbacc9aSKonstantin Sinyuk 
12*8cbacc9aSKonstantin Sinyuk #include <linux/types.h>
13*8cbacc9aSKonstantin Sinyuk #include <linux/fs.h>
14*8cbacc9aSKonstantin Sinyuk #include <linux/seq_file.h>
15*8cbacc9aSKonstantin Sinyuk #include <linux/ktime.h>     /* ktime functions */
16*8cbacc9aSKonstantin Sinyuk #include <linux/delay.h>     /* usleep_range */
17*8cbacc9aSKonstantin Sinyuk #include <linux/kernel.h>    /* might_sleep_if */
18*8cbacc9aSKonstantin Sinyuk #include <linux/errno.h>     /* error codes */
19*8cbacc9aSKonstantin Sinyuk 
20*8cbacc9aSKonstantin Sinyuk /* Forward declarations */
21*8cbacc9aSKonstantin Sinyuk struct hl_device;
22*8cbacc9aSKonstantin Sinyuk struct file;
23*8cbacc9aSKonstantin Sinyuk 
24*8cbacc9aSKonstantin Sinyuk /* Enable only if Kconfig selected */
25*8cbacc9aSKonstantin Sinyuk #ifdef CONFIG_HL_HLDIO
26*8cbacc9aSKonstantin Sinyuk /**
27*8cbacc9aSKonstantin Sinyuk  * struct hl_p2p_region - describes a single P2P memory region
28*8cbacc9aSKonstantin Sinyuk  * @p2ppages: array of page structs for the P2P memory
29*8cbacc9aSKonstantin Sinyuk  * @p2pmem: virtual address of the P2P memory region
30*8cbacc9aSKonstantin Sinyuk  * @device_pa: physical address on the device
31*8cbacc9aSKonstantin Sinyuk  * @bar_offset: offset within the BAR
32*8cbacc9aSKonstantin Sinyuk  * @size: size of the region in bytes
33*8cbacc9aSKonstantin Sinyuk  * @bar: BAR number containing this region
34*8cbacc9aSKonstantin Sinyuk  */
35*8cbacc9aSKonstantin Sinyuk struct hl_p2p_region {
36*8cbacc9aSKonstantin Sinyuk 	struct page **p2ppages;
37*8cbacc9aSKonstantin Sinyuk 	void *p2pmem;
38*8cbacc9aSKonstantin Sinyuk 	u64 device_pa;
39*8cbacc9aSKonstantin Sinyuk 	u64 bar_offset;
40*8cbacc9aSKonstantin Sinyuk 	u64 size;
41*8cbacc9aSKonstantin Sinyuk 	int bar;
42*8cbacc9aSKonstantin Sinyuk };
43*8cbacc9aSKonstantin Sinyuk 
44*8cbacc9aSKonstantin Sinyuk /**
45*8cbacc9aSKonstantin Sinyuk  * struct hl_dio_stats - Direct I/O statistics
46*8cbacc9aSKonstantin Sinyuk  * @total_ops: total number of operations attempted
47*8cbacc9aSKonstantin Sinyuk  * @successful_ops: number of successful operations
48*8cbacc9aSKonstantin Sinyuk  * @failed_ops: number of failed operations
49*8cbacc9aSKonstantin Sinyuk  * @bytes_transferred: total bytes successfully transferred
50*8cbacc9aSKonstantin Sinyuk  * @last_len_read: length of the last read operation
51*8cbacc9aSKonstantin Sinyuk  */
52*8cbacc9aSKonstantin Sinyuk struct hl_dio_stats {
53*8cbacc9aSKonstantin Sinyuk 	u64 total_ops;
54*8cbacc9aSKonstantin Sinyuk 	u64 successful_ops;
55*8cbacc9aSKonstantin Sinyuk 	u64 failed_ops;
56*8cbacc9aSKonstantin Sinyuk 	u64 bytes_transferred;
57*8cbacc9aSKonstantin Sinyuk 	size_t last_len_read;
58*8cbacc9aSKonstantin Sinyuk };
59*8cbacc9aSKonstantin Sinyuk 
60*8cbacc9aSKonstantin Sinyuk /**
61*8cbacc9aSKonstantin Sinyuk  * struct hl_dio - describes habanalabs direct storage interaction interface
62*8cbacc9aSKonstantin Sinyuk  * @p2prs: array of p2p regions
63*8cbacc9aSKonstantin Sinyuk  * @inflight_ios: percpu counter for inflight ios
64*8cbacc9aSKonstantin Sinyuk  * @np2prs: number of elements in p2prs
65*8cbacc9aSKonstantin Sinyuk  * @io_enabled: 1 if io is enabled 0 otherwise
66*8cbacc9aSKonstantin Sinyuk  */
67*8cbacc9aSKonstantin Sinyuk struct hl_dio {
68*8cbacc9aSKonstantin Sinyuk 	struct hl_p2p_region *p2prs;
69*8cbacc9aSKonstantin Sinyuk 	s64 __percpu *inflight_ios;
70*8cbacc9aSKonstantin Sinyuk 	u8 np2prs;
71*8cbacc9aSKonstantin Sinyuk 	u8 io_enabled;
72*8cbacc9aSKonstantin Sinyuk };
73*8cbacc9aSKonstantin Sinyuk 
74*8cbacc9aSKonstantin Sinyuk int hl_dio_ssd2hl(struct hl_device *hdev, struct hl_ctx *ctx, int fd,
75*8cbacc9aSKonstantin Sinyuk 		  u64 device_va, off_t off_bytes, size_t len_bytes,
76*8cbacc9aSKonstantin Sinyuk 		  size_t *len_read);
77*8cbacc9aSKonstantin Sinyuk void hl_p2p_region_fini_all(struct hl_device *hdev);
78*8cbacc9aSKonstantin Sinyuk int hl_p2p_region_init(struct hl_device *hdev, struct hl_p2p_region *p2pr);
79*8cbacc9aSKonstantin Sinyuk int hl_dio_start(struct hl_device *hdev);
80*8cbacc9aSKonstantin Sinyuk void hl_dio_stop(struct hl_device *hdev);
81*8cbacc9aSKonstantin Sinyuk 
82*8cbacc9aSKonstantin Sinyuk /* Init/teardown */
83*8cbacc9aSKonstantin Sinyuk int hl_hldio_init(struct hl_device *hdev);
84*8cbacc9aSKonstantin Sinyuk void hl_hldio_fini(struct hl_device *hdev);
85*8cbacc9aSKonstantin Sinyuk 
86*8cbacc9aSKonstantin Sinyuk /* File operations */
87*8cbacc9aSKonstantin Sinyuk long hl_hldio_ioctl(struct file *filep, unsigned int cmd, unsigned long arg);
88*8cbacc9aSKonstantin Sinyuk 
89*8cbacc9aSKonstantin Sinyuk /* DebugFS hooks */
90*8cbacc9aSKonstantin Sinyuk #ifdef CONFIG_DEBUG_FS
91*8cbacc9aSKonstantin Sinyuk void hl_hldio_debugfs_init(struct hl_device *hdev);
92*8cbacc9aSKonstantin Sinyuk void hl_hldio_debugfs_fini(struct hl_device *hdev);
93*8cbacc9aSKonstantin Sinyuk #else
94*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_debugfs_init(struct hl_device *hdev) { }
95*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_debugfs_fini(struct hl_device *hdev) { }
96*8cbacc9aSKonstantin Sinyuk #endif
97*8cbacc9aSKonstantin Sinyuk 
98*8cbacc9aSKonstantin Sinyuk #else /* !CONFIG_HL_HLDIO */
99*8cbacc9aSKonstantin Sinyuk 
100*8cbacc9aSKonstantin Sinyuk struct hl_p2p_region;
101*8cbacc9aSKonstantin Sinyuk /* Stubs when HLDIO is disabled */
102*8cbacc9aSKonstantin Sinyuk static inline int hl_dio_ssd2hl(struct hl_device *hdev, struct hl_ctx *ctx, int fd,
103*8cbacc9aSKonstantin Sinyuk 		  u64 device_va, off_t off_bytes, size_t len_bytes,
104*8cbacc9aSKonstantin Sinyuk 		  size_t *len_read)
105*8cbacc9aSKonstantin Sinyuk { return -EOPNOTSUPP; }
106*8cbacc9aSKonstantin Sinyuk static inline void hl_p2p_region_fini_all(struct hl_device *hdev) {}
107*8cbacc9aSKonstantin Sinyuk static inline int hl_p2p_region_init(struct hl_device *hdev, struct hl_p2p_region *p2pr)
108*8cbacc9aSKonstantin Sinyuk { return -EOPNOTSUPP; }
109*8cbacc9aSKonstantin Sinyuk static inline int hl_dio_start(struct hl_device *hdev) { return -EOPNOTSUPP; }
110*8cbacc9aSKonstantin Sinyuk static inline void hl_dio_stop(struct hl_device *hdev) {}
111*8cbacc9aSKonstantin Sinyuk 
112*8cbacc9aSKonstantin Sinyuk static inline int hl_hldio_init(struct hl_device *hdev) { return 0; }
113*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_fini(struct hl_device *hdev) { }
114*8cbacc9aSKonstantin Sinyuk static inline long hl_hldio_ioctl(struct file *f, unsigned int c,
115*8cbacc9aSKonstantin Sinyuk 				  unsigned long a)
116*8cbacc9aSKonstantin Sinyuk { return -ENOTTY; }
117*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_debugfs_init(struct hl_device *hdev) { }
118*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_debugfs_fini(struct hl_device *hdev) { }
119*8cbacc9aSKonstantin Sinyuk 
120*8cbacc9aSKonstantin Sinyuk #endif /* CONFIG_HL_HLDIO */
121*8cbacc9aSKonstantin Sinyuk 
122*8cbacc9aSKonstantin Sinyuk /* Simplified polling macro for HLDIO (no simulator support) */
123*8cbacc9aSKonstantin Sinyuk #define hl_poll_timeout_condition(hdev, cond, sleep_us, timeout_us) \
124*8cbacc9aSKonstantin Sinyuk ({ \
125*8cbacc9aSKonstantin Sinyuk 	ktime_t __timeout = ktime_add_us(ktime_get(), timeout_us); \
126*8cbacc9aSKonstantin Sinyuk 	might_sleep_if(sleep_us); \
127*8cbacc9aSKonstantin Sinyuk 	(void)(hdev); /* keep signature consistent, hdev unused */ \
128*8cbacc9aSKonstantin Sinyuk 	for (;;) { \
129*8cbacc9aSKonstantin Sinyuk 		mb(); /* ensure ordering of memory operations */ \
130*8cbacc9aSKonstantin Sinyuk 		if (cond) \
131*8cbacc9aSKonstantin Sinyuk 			break; \
132*8cbacc9aSKonstantin Sinyuk 		if (timeout_us && ktime_compare(ktime_get(), __timeout) > 0) \
133*8cbacc9aSKonstantin Sinyuk 			break; \
134*8cbacc9aSKonstantin Sinyuk 		if (sleep_us) \
135*8cbacc9aSKonstantin Sinyuk 			usleep_range((sleep_us >> 2) + 1, sleep_us); \
136*8cbacc9aSKonstantin Sinyuk 	} \
137*8cbacc9aSKonstantin Sinyuk 	(cond) ? 0 : -ETIMEDOUT; \
138*8cbacc9aSKonstantin Sinyuk })
139*8cbacc9aSKonstantin Sinyuk 
140*8cbacc9aSKonstantin Sinyuk #ifdef CONFIG_HL_HLDIO
141*8cbacc9aSKonstantin Sinyuk bool hl_device_supports_nvme(struct hl_device *hdev);
142*8cbacc9aSKonstantin Sinyuk #else
143*8cbacc9aSKonstantin Sinyuk static inline bool hl_device_supports_nvme(struct hl_device *hdev) { return false; }
144*8cbacc9aSKonstantin Sinyuk #endif
145*8cbacc9aSKonstantin Sinyuk 
146*8cbacc9aSKonstantin Sinyuk #endif /* __HL_HLDIO_H__ */
147