1 /* 2 * Copyright 2016 Advanced Micro Devices, Inc. 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice shall be included in 12 * all copies or substantial portions of the Software. 13 * 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 * OTHER DEALINGS IN THE SOFTWARE. 21 * 22 */ 23 24 #ifndef __AMDGPU_TTM_H__ 25 #define __AMDGPU_TTM_H__ 26 27 #include <linux/dma-direction.h> 28 #include <drm/gpu_scheduler.h> 29 #include <drm/ttm/ttm_placement.h> 30 #include "amdgpu_vram_mgr.h" 31 #include "amdgpu_hmm.h" 32 #include "amdgpu_gmc.h" 33 34 #define AMDGPU_PL_GDS (TTM_PL_PRIV + 0) 35 #define AMDGPU_PL_GWS (TTM_PL_PRIV + 1) 36 #define AMDGPU_PL_OA (TTM_PL_PRIV + 2) 37 #define AMDGPU_PL_PREEMPT (TTM_PL_PRIV + 3) 38 #define AMDGPU_PL_DOORBELL (TTM_PL_PRIV + 4) 39 #define AMDGPU_PL_MMIO_REMAP (TTM_PL_PRIV + 5) 40 #define __AMDGPU_PL_NUM (TTM_PL_PRIV + 6) 41 42 #define AMDGPU_GTT_MAX_TRANSFER_SIZE 1024 43 44 extern const struct attribute_group amdgpu_vram_mgr_attr_group; 45 extern const struct attribute_group amdgpu_gtt_mgr_attr_group; 46 47 struct hmm_range; 48 49 struct amdgpu_gtt_mgr { 50 struct ttm_resource_manager manager; 51 struct drm_mm mm; 52 spinlock_t lock; 53 }; 54 55 struct amdgpu_ttm_buffer_entity { 56 struct drm_sched_entity base; 57 struct mutex lock; 58 struct drm_mm_node gart_node; 59 u64 gart_window_offs[2]; 60 }; 61 62 enum amdgpu_resv_region_id { 63 AMDGPU_RESV_STOLEN_VGA, 64 AMDGPU_RESV_STOLEN_EXTENDED, 65 AMDGPU_RESV_STOLEN_RESERVED, 66 AMDGPU_RESV_FW, 67 AMDGPU_RESV_FW_EXTEND, 68 AMDGPU_RESV_FW_VRAM_USAGE, 69 AMDGPU_RESV_DRV_VRAM_USAGE, 70 AMDGPU_RESV_MEM_TRAIN, 71 AMDGPU_RESV_MAX 72 }; 73 74 struct amdgpu_vram_resv { 75 uint64_t offset; 76 uint64_t size; 77 struct amdgpu_bo *bo; 78 void *cpu_ptr; 79 bool needs_cpu_map; 80 }; 81 82 struct amdgpu_mman { 83 struct ttm_device bdev; 84 struct ttm_pool *ttm_pools; 85 bool initialized; 86 void __iomem *aper_base_kaddr; 87 88 /* buffer handling */ 89 const struct amdgpu_buffer_funcs *buffer_funcs; 90 struct amdgpu_ring *buffer_funcs_ring; 91 bool buffer_funcs_enabled; 92 93 /* @default_entity: for workarounds, has no gart windows */ 94 struct amdgpu_ttm_buffer_entity default_entity; 95 struct amdgpu_ttm_buffer_entity *clear_entities; 96 atomic_t next_clear_entity; 97 u32 num_clear_entities; 98 struct amdgpu_ttm_buffer_entity move_entities[TTM_NUM_MOVE_FENCES]; 99 atomic_t next_move_entity; 100 u32 num_move_entities; 101 102 struct amdgpu_vram_mgr vram_mgr; 103 struct amdgpu_gtt_mgr gtt_mgr; 104 struct ttm_resource_manager preempt_mgr; 105 106 bool keep_stolen_vga_memory; 107 108 /* driver VRAM reservation */ 109 u64 drv_vram_usage_start_offset; 110 u64 drv_vram_usage_size; 111 struct amdgpu_bo *drv_vram_usage_reserved_bo; 112 void *drv_vram_usage_va; 113 114 struct amdgpu_vram_resv resv_region[AMDGPU_RESV_MAX]; 115 116 /* PAGE_SIZE'd BO for process memory r/w over SDMA. */ 117 struct amdgpu_bo *sdma_access_bo; 118 void *sdma_access_ptr; 119 }; 120 121 struct amdgpu_copy_mem { 122 struct ttm_buffer_object *bo; 123 struct ttm_resource *mem; 124 unsigned long offset; 125 }; 126 127 #define AMDGPU_COPY_FLAGS_TMZ (1 << 0) 128 #define AMDGPU_COPY_FLAGS_READ_DECOMPRESSED (1 << 1) 129 #define AMDGPU_COPY_FLAGS_WRITE_COMPRESSED (1 << 2) 130 #define AMDGPU_COPY_FLAGS_MAX_COMPRESSED_SHIFT 3 131 #define AMDGPU_COPY_FLAGS_MAX_COMPRESSED_MASK 0x03 132 #define AMDGPU_COPY_FLAGS_NUMBER_TYPE_SHIFT 5 133 #define AMDGPU_COPY_FLAGS_NUMBER_TYPE_MASK 0x07 134 #define AMDGPU_COPY_FLAGS_DATA_FORMAT_SHIFT 8 135 #define AMDGPU_COPY_FLAGS_DATA_FORMAT_MASK 0x3f 136 #define AMDGPU_COPY_FLAGS_WRITE_COMPRESS_DISABLE_SHIFT 14 137 #define AMDGPU_COPY_FLAGS_WRITE_COMPRESS_DISABLE_MASK 0x1 138 139 #define AMDGPU_COPY_FLAGS_SET(field, value) \ 140 (((__u32)(value) & AMDGPU_COPY_FLAGS_##field##_MASK) << AMDGPU_COPY_FLAGS_##field##_SHIFT) 141 #define AMDGPU_COPY_FLAGS_GET(value, field) \ 142 (((__u32)(value) >> AMDGPU_COPY_FLAGS_##field##_SHIFT) & AMDGPU_COPY_FLAGS_##field##_MASK) 143 144 int amdgpu_gtt_mgr_init(struct amdgpu_device *adev, uint64_t gtt_size); 145 void amdgpu_gtt_mgr_fini(struct amdgpu_device *adev); 146 int amdgpu_preempt_mgr_init(struct amdgpu_device *adev); 147 void amdgpu_preempt_mgr_fini(struct amdgpu_device *adev); 148 int amdgpu_vram_mgr_init(struct amdgpu_device *adev); 149 void amdgpu_vram_mgr_fini(struct amdgpu_device *adev); 150 151 bool amdgpu_gtt_mgr_has_gart_addr(struct ttm_resource *mem); 152 void amdgpu_gtt_mgr_recover(struct amdgpu_gtt_mgr *mgr); 153 154 int amdgpu_gtt_mgr_alloc_entries(struct amdgpu_gtt_mgr *mgr, 155 struct drm_mm_node *mm_node, 156 u64 num_pages, 157 enum drm_mm_insert_mode mode); 158 void amdgpu_gtt_mgr_free_entries(struct amdgpu_gtt_mgr *mgr, 159 struct drm_mm_node *mm_node); 160 uint64_t amdgpu_preempt_mgr_usage(struct ttm_resource_manager *man); 161 162 u64 amdgpu_vram_mgr_bo_visible_size(struct amdgpu_bo *bo); 163 int amdgpu_vram_mgr_alloc_sgt(struct amdgpu_device *adev, 164 struct ttm_resource *mem, 165 u64 offset, u64 size, 166 struct device *dev, 167 enum dma_data_direction dir, 168 struct sg_table **sgt); 169 void amdgpu_vram_mgr_free_sgt(struct device *dev, 170 enum dma_data_direction dir, 171 struct sg_table *sgt); 172 uint64_t amdgpu_vram_mgr_vis_usage(struct amdgpu_vram_mgr *mgr); 173 int amdgpu_vram_mgr_reserve_range(struct amdgpu_vram_mgr *mgr, 174 uint64_t start, uint64_t size); 175 int amdgpu_vram_mgr_query_page_status(struct amdgpu_vram_mgr *mgr, 176 uint64_t start); 177 void amdgpu_vram_mgr_clear_reset_blocks(struct amdgpu_device *adev); 178 179 bool amdgpu_res_cpu_visible(struct amdgpu_device *adev, 180 struct ttm_resource *res); 181 182 void amdgpu_ttm_init_vram_resv(struct amdgpu_device *adev, 183 enum amdgpu_resv_region_id id, 184 uint64_t offset, uint64_t size, 185 bool needs_cpu_map); 186 int amdgpu_ttm_mark_vram_reserved(struct amdgpu_device *adev, 187 enum amdgpu_resv_region_id id); 188 void amdgpu_ttm_unmark_vram_reserved(struct amdgpu_device *adev, 189 enum amdgpu_resv_region_id id); 190 191 int amdgpu_ttm_init(struct amdgpu_device *adev); 192 void amdgpu_ttm_fini(struct amdgpu_device *adev); 193 void amdgpu_ttm_set_buffer_funcs_status(struct amdgpu_device *adev, 194 bool enable); 195 int amdgpu_copy_buffer(struct amdgpu_device *adev, 196 struct amdgpu_ttm_buffer_entity *entity, 197 uint64_t src_offset, 198 uint64_t dst_offset, uint32_t byte_count, 199 struct dma_resv *resv, 200 struct dma_fence **fence, 201 bool vm_needs_flush, uint32_t copy_flags); 202 int amdgpu_ttm_clear_buffer(struct amdgpu_bo *bo, 203 struct dma_resv *resv, 204 struct dma_fence **fence); 205 int amdgpu_fill_buffer(struct amdgpu_ttm_buffer_entity *entity, 206 struct amdgpu_bo *bo, 207 uint32_t src_data, 208 struct dma_resv *resv, 209 struct dma_fence **f, 210 u64 k_job_id); 211 struct amdgpu_ttm_buffer_entity *amdgpu_ttm_next_clear_entity(struct amdgpu_device *adev); 212 213 int amdgpu_ttm_alloc_gart(struct ttm_buffer_object *bo); 214 void amdgpu_ttm_recover_gart(struct ttm_buffer_object *tbo); 215 uint64_t amdgpu_ttm_domain_start(struct amdgpu_device *adev, uint32_t type); 216 217 #if IS_ENABLED(CONFIG_DRM_AMDGPU_USERPTR) 218 int amdgpu_ttm_tt_get_user_pages(struct amdgpu_bo *bo, 219 struct amdgpu_hmm_range *range); 220 #else 221 static inline int amdgpu_ttm_tt_get_user_pages(struct amdgpu_bo *bo, 222 struct amdgpu_hmm_range *range) 223 { 224 return -EPERM; 225 } 226 #endif 227 228 /** 229 * amdgpu_compute_gart_address() - Returns GART address of an entity's window 230 * @gmc: The &struct amdgpu_gmc instance to use 231 * @entity: The &struct amdgpu_ttm_buffer_entity owning the GART window 232 * @index: The window to use (must be 0 or 1) 233 */ 234 static inline u64 amdgpu_compute_gart_address(struct amdgpu_gmc *gmc, 235 struct amdgpu_ttm_buffer_entity *entity, 236 int index) 237 { 238 return gmc->gart_start + entity->gart_window_offs[index]; 239 } 240 241 /** 242 * amdgpu_gtt_node_to_byte_offset() - Returns a byte offset of a gtt node 243 */ 244 static inline u64 amdgpu_gtt_node_to_byte_offset(const struct drm_mm_node *gtt_node) 245 { 246 return gtt_node->start * (u64)PAGE_SIZE; 247 } 248 249 void amdgpu_ttm_tt_set_user_pages(struct ttm_tt *ttm, struct amdgpu_hmm_range *range); 250 int amdgpu_ttm_tt_get_userptr(const struct ttm_buffer_object *tbo, 251 uint64_t *user_addr); 252 int amdgpu_ttm_tt_set_userptr(struct ttm_buffer_object *bo, 253 uint64_t addr, uint32_t flags); 254 bool amdgpu_ttm_tt_has_userptr(struct ttm_tt *ttm); 255 struct mm_struct *amdgpu_ttm_tt_get_usermm(struct ttm_tt *ttm); 256 bool amdgpu_ttm_tt_affect_userptr(struct ttm_tt *ttm, unsigned long start, 257 unsigned long end, unsigned long *userptr); 258 bool amdgpu_ttm_tt_userptr_invalidated(struct ttm_tt *ttm, 259 int *last_invalidated); 260 bool amdgpu_ttm_tt_is_userptr(struct ttm_tt *ttm); 261 bool amdgpu_ttm_tt_is_readonly(struct ttm_tt *ttm); 262 uint64_t amdgpu_ttm_tt_pde_flags(struct ttm_tt *ttm, struct ttm_resource *mem); 263 uint64_t amdgpu_ttm_tt_pte_flags(struct amdgpu_device *adev, struct ttm_tt *ttm, 264 struct ttm_resource *mem); 265 int amdgpu_ttm_evict_resources(struct amdgpu_device *adev, int mem_type); 266 267 void amdgpu_ttm_debugfs_init(struct amdgpu_device *adev); 268 269 int amdgpu_ttm_mmio_remap_alloc_sgt(struct amdgpu_device *adev, 270 struct ttm_resource *res, 271 struct device *dev, 272 enum dma_data_direction dir, 273 struct sg_table **sgt); 274 void amdgpu_ttm_mmio_remap_free_sgt(struct device *dev, 275 enum dma_data_direction dir, 276 struct sg_table *sgt); 277 278 #endif 279