1*8cbacc9aSKonstantin Sinyuk /* SPDX-License-Identifier: GPL-2.0-only */ 2*8cbacc9aSKonstantin Sinyuk /* 3*8cbacc9aSKonstantin Sinyuk * hldio.h - NVMe Direct I/O (HLDIO) infrastructure for Habana Labs Driver 4*8cbacc9aSKonstantin Sinyuk * 5*8cbacc9aSKonstantin Sinyuk * This feature requires specific hardware setup and must not be built 6*8cbacc9aSKonstantin Sinyuk * under COMPILE_TEST. 7*8cbacc9aSKonstantin Sinyuk */ 8*8cbacc9aSKonstantin Sinyuk 9*8cbacc9aSKonstantin Sinyuk #ifndef __HL_HLDIO_H__ 10*8cbacc9aSKonstantin Sinyuk #define __HL_HLDIO_H__ 11*8cbacc9aSKonstantin Sinyuk 12*8cbacc9aSKonstantin Sinyuk #include <linux/types.h> 13*8cbacc9aSKonstantin Sinyuk #include <linux/fs.h> 14*8cbacc9aSKonstantin Sinyuk #include <linux/seq_file.h> 15*8cbacc9aSKonstantin Sinyuk #include <linux/ktime.h> /* ktime functions */ 16*8cbacc9aSKonstantin Sinyuk #include <linux/delay.h> /* usleep_range */ 17*8cbacc9aSKonstantin Sinyuk #include <linux/kernel.h> /* might_sleep_if */ 18*8cbacc9aSKonstantin Sinyuk #include <linux/errno.h> /* error codes */ 19*8cbacc9aSKonstantin Sinyuk 20*8cbacc9aSKonstantin Sinyuk /* Forward declarations */ 21*8cbacc9aSKonstantin Sinyuk struct hl_device; 22*8cbacc9aSKonstantin Sinyuk struct file; 23*8cbacc9aSKonstantin Sinyuk 24*8cbacc9aSKonstantin Sinyuk /* Enable only if Kconfig selected */ 25*8cbacc9aSKonstantin Sinyuk #ifdef CONFIG_HL_HLDIO 26*8cbacc9aSKonstantin Sinyuk /** 27*8cbacc9aSKonstantin Sinyuk * struct hl_p2p_region - describes a single P2P memory region 28*8cbacc9aSKonstantin Sinyuk * @p2ppages: array of page structs for the P2P memory 29*8cbacc9aSKonstantin Sinyuk * @p2pmem: virtual address of the P2P memory region 30*8cbacc9aSKonstantin Sinyuk * @device_pa: physical address on the device 31*8cbacc9aSKonstantin Sinyuk * @bar_offset: offset within the BAR 32*8cbacc9aSKonstantin Sinyuk * @size: size of the region in bytes 33*8cbacc9aSKonstantin Sinyuk * @bar: BAR number containing this region 34*8cbacc9aSKonstantin Sinyuk */ 35*8cbacc9aSKonstantin Sinyuk struct hl_p2p_region { 36*8cbacc9aSKonstantin Sinyuk struct page **p2ppages; 37*8cbacc9aSKonstantin Sinyuk void *p2pmem; 38*8cbacc9aSKonstantin Sinyuk u64 device_pa; 39*8cbacc9aSKonstantin Sinyuk u64 bar_offset; 40*8cbacc9aSKonstantin Sinyuk u64 size; 41*8cbacc9aSKonstantin Sinyuk int bar; 42*8cbacc9aSKonstantin Sinyuk }; 43*8cbacc9aSKonstantin Sinyuk 44*8cbacc9aSKonstantin Sinyuk /** 45*8cbacc9aSKonstantin Sinyuk * struct hl_dio_stats - Direct I/O statistics 46*8cbacc9aSKonstantin Sinyuk * @total_ops: total number of operations attempted 47*8cbacc9aSKonstantin Sinyuk * @successful_ops: number of successful operations 48*8cbacc9aSKonstantin Sinyuk * @failed_ops: number of failed operations 49*8cbacc9aSKonstantin Sinyuk * @bytes_transferred: total bytes successfully transferred 50*8cbacc9aSKonstantin Sinyuk * @last_len_read: length of the last read operation 51*8cbacc9aSKonstantin Sinyuk */ 52*8cbacc9aSKonstantin Sinyuk struct hl_dio_stats { 53*8cbacc9aSKonstantin Sinyuk u64 total_ops; 54*8cbacc9aSKonstantin Sinyuk u64 successful_ops; 55*8cbacc9aSKonstantin Sinyuk u64 failed_ops; 56*8cbacc9aSKonstantin Sinyuk u64 bytes_transferred; 57*8cbacc9aSKonstantin Sinyuk size_t last_len_read; 58*8cbacc9aSKonstantin Sinyuk }; 59*8cbacc9aSKonstantin Sinyuk 60*8cbacc9aSKonstantin Sinyuk /** 61*8cbacc9aSKonstantin Sinyuk * struct hl_dio - describes habanalabs direct storage interaction interface 62*8cbacc9aSKonstantin Sinyuk * @p2prs: array of p2p regions 63*8cbacc9aSKonstantin Sinyuk * @inflight_ios: percpu counter for inflight ios 64*8cbacc9aSKonstantin Sinyuk * @np2prs: number of elements in p2prs 65*8cbacc9aSKonstantin Sinyuk * @io_enabled: 1 if io is enabled 0 otherwise 66*8cbacc9aSKonstantin Sinyuk */ 67*8cbacc9aSKonstantin Sinyuk struct hl_dio { 68*8cbacc9aSKonstantin Sinyuk struct hl_p2p_region *p2prs; 69*8cbacc9aSKonstantin Sinyuk s64 __percpu *inflight_ios; 70*8cbacc9aSKonstantin Sinyuk u8 np2prs; 71*8cbacc9aSKonstantin Sinyuk u8 io_enabled; 72*8cbacc9aSKonstantin Sinyuk }; 73*8cbacc9aSKonstantin Sinyuk 74*8cbacc9aSKonstantin Sinyuk int hl_dio_ssd2hl(struct hl_device *hdev, struct hl_ctx *ctx, int fd, 75*8cbacc9aSKonstantin Sinyuk u64 device_va, off_t off_bytes, size_t len_bytes, 76*8cbacc9aSKonstantin Sinyuk size_t *len_read); 77*8cbacc9aSKonstantin Sinyuk void hl_p2p_region_fini_all(struct hl_device *hdev); 78*8cbacc9aSKonstantin Sinyuk int hl_p2p_region_init(struct hl_device *hdev, struct hl_p2p_region *p2pr); 79*8cbacc9aSKonstantin Sinyuk int hl_dio_start(struct hl_device *hdev); 80*8cbacc9aSKonstantin Sinyuk void hl_dio_stop(struct hl_device *hdev); 81*8cbacc9aSKonstantin Sinyuk 82*8cbacc9aSKonstantin Sinyuk /* Init/teardown */ 83*8cbacc9aSKonstantin Sinyuk int hl_hldio_init(struct hl_device *hdev); 84*8cbacc9aSKonstantin Sinyuk void hl_hldio_fini(struct hl_device *hdev); 85*8cbacc9aSKonstantin Sinyuk 86*8cbacc9aSKonstantin Sinyuk /* File operations */ 87*8cbacc9aSKonstantin Sinyuk long hl_hldio_ioctl(struct file *filep, unsigned int cmd, unsigned long arg); 88*8cbacc9aSKonstantin Sinyuk 89*8cbacc9aSKonstantin Sinyuk /* DebugFS hooks */ 90*8cbacc9aSKonstantin Sinyuk #ifdef CONFIG_DEBUG_FS 91*8cbacc9aSKonstantin Sinyuk void hl_hldio_debugfs_init(struct hl_device *hdev); 92*8cbacc9aSKonstantin Sinyuk void hl_hldio_debugfs_fini(struct hl_device *hdev); 93*8cbacc9aSKonstantin Sinyuk #else 94*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_debugfs_init(struct hl_device *hdev) { } 95*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_debugfs_fini(struct hl_device *hdev) { } 96*8cbacc9aSKonstantin Sinyuk #endif 97*8cbacc9aSKonstantin Sinyuk 98*8cbacc9aSKonstantin Sinyuk #else /* !CONFIG_HL_HLDIO */ 99*8cbacc9aSKonstantin Sinyuk 100*8cbacc9aSKonstantin Sinyuk struct hl_p2p_region; 101*8cbacc9aSKonstantin Sinyuk /* Stubs when HLDIO is disabled */ 102*8cbacc9aSKonstantin Sinyuk static inline int hl_dio_ssd2hl(struct hl_device *hdev, struct hl_ctx *ctx, int fd, 103*8cbacc9aSKonstantin Sinyuk u64 device_va, off_t off_bytes, size_t len_bytes, 104*8cbacc9aSKonstantin Sinyuk size_t *len_read) 105*8cbacc9aSKonstantin Sinyuk { return -EOPNOTSUPP; } 106*8cbacc9aSKonstantin Sinyuk static inline void hl_p2p_region_fini_all(struct hl_device *hdev) {} 107*8cbacc9aSKonstantin Sinyuk static inline int hl_p2p_region_init(struct hl_device *hdev, struct hl_p2p_region *p2pr) 108*8cbacc9aSKonstantin Sinyuk { return -EOPNOTSUPP; } 109*8cbacc9aSKonstantin Sinyuk static inline int hl_dio_start(struct hl_device *hdev) { return -EOPNOTSUPP; } 110*8cbacc9aSKonstantin Sinyuk static inline void hl_dio_stop(struct hl_device *hdev) {} 111*8cbacc9aSKonstantin Sinyuk 112*8cbacc9aSKonstantin Sinyuk static inline int hl_hldio_init(struct hl_device *hdev) { return 0; } 113*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_fini(struct hl_device *hdev) { } 114*8cbacc9aSKonstantin Sinyuk static inline long hl_hldio_ioctl(struct file *f, unsigned int c, 115*8cbacc9aSKonstantin Sinyuk unsigned long a) 116*8cbacc9aSKonstantin Sinyuk { return -ENOTTY; } 117*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_debugfs_init(struct hl_device *hdev) { } 118*8cbacc9aSKonstantin Sinyuk static inline void hl_hldio_debugfs_fini(struct hl_device *hdev) { } 119*8cbacc9aSKonstantin Sinyuk 120*8cbacc9aSKonstantin Sinyuk #endif /* CONFIG_HL_HLDIO */ 121*8cbacc9aSKonstantin Sinyuk 122*8cbacc9aSKonstantin Sinyuk /* Simplified polling macro for HLDIO (no simulator support) */ 123*8cbacc9aSKonstantin Sinyuk #define hl_poll_timeout_condition(hdev, cond, sleep_us, timeout_us) \ 124*8cbacc9aSKonstantin Sinyuk ({ \ 125*8cbacc9aSKonstantin Sinyuk ktime_t __timeout = ktime_add_us(ktime_get(), timeout_us); \ 126*8cbacc9aSKonstantin Sinyuk might_sleep_if(sleep_us); \ 127*8cbacc9aSKonstantin Sinyuk (void)(hdev); /* keep signature consistent, hdev unused */ \ 128*8cbacc9aSKonstantin Sinyuk for (;;) { \ 129*8cbacc9aSKonstantin Sinyuk mb(); /* ensure ordering of memory operations */ \ 130*8cbacc9aSKonstantin Sinyuk if (cond) \ 131*8cbacc9aSKonstantin Sinyuk break; \ 132*8cbacc9aSKonstantin Sinyuk if (timeout_us && ktime_compare(ktime_get(), __timeout) > 0) \ 133*8cbacc9aSKonstantin Sinyuk break; \ 134*8cbacc9aSKonstantin Sinyuk if (sleep_us) \ 135*8cbacc9aSKonstantin Sinyuk usleep_range((sleep_us >> 2) + 1, sleep_us); \ 136*8cbacc9aSKonstantin Sinyuk } \ 137*8cbacc9aSKonstantin Sinyuk (cond) ? 0 : -ETIMEDOUT; \ 138*8cbacc9aSKonstantin Sinyuk }) 139*8cbacc9aSKonstantin Sinyuk 140*8cbacc9aSKonstantin Sinyuk #ifdef CONFIG_HL_HLDIO 141*8cbacc9aSKonstantin Sinyuk bool hl_device_supports_nvme(struct hl_device *hdev); 142*8cbacc9aSKonstantin Sinyuk #else 143*8cbacc9aSKonstantin Sinyuk static inline bool hl_device_supports_nvme(struct hl_device *hdev) { return false; } 144*8cbacc9aSKonstantin Sinyuk #endif 145*8cbacc9aSKonstantin Sinyuk 146*8cbacc9aSKonstantin Sinyuk #endif /* __HL_HLDIO_H__ */ 147