xref: /linux/drivers/gpu/drm/amd/amdgpu/amdgpu_gem.c (revision c7062be3380cb20c8b1c4a935a13f1848ead0719)
1 /*
2  * Copyright 2008 Advanced Micro Devices, Inc.
3  * Copyright 2008 Red Hat Inc.
4  * Copyright 2009 Jerome Glisse.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the "Software"),
8  * to deal in the Software without restriction, including without limitation
9  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10  * and/or sell copies of the Software, and to permit persons to whom the
11  * Software is furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be included in
14  * all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22  * OTHER DEALINGS IN THE SOFTWARE.
23  *
24  * Authors: Dave Airlie
25  *          Alex Deucher
26  *          Jerome Glisse
27  */
28 #include <linux/ktime.h>
29 #include <linux/module.h>
30 #include <linux/pagemap.h>
31 #include <linux/pci.h>
32 #include <linux/dma-buf.h>
33 
34 #include <drm/amdgpu_drm.h>
35 #include <drm/drm_drv.h>
36 #include <drm/drm_exec.h>
37 #include <drm/drm_gem_ttm_helper.h>
38 #include <drm/ttm/ttm_tt.h>
39 #include <drm/drm_syncobj.h>
40 
41 #include "amdgpu.h"
42 #include "amdgpu_display.h"
43 #include "amdgpu_dma_buf.h"
44 #include "amdgpu_hmm.h"
45 #include "amdgpu_xgmi.h"
46 #include "amdgpu_vm.h"
47 
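/**
 * amdgpu_gem_add_input_fence - wait for user-supplied syncobj fences
 *
 * @filp: drm file pointer
 * @syncobj_handles_array: user pointer to an array of syncobj handles
 * @num_syncobj_handles: number of handles in the array
 *
 * Copies the handle array from user space and synchronously waits on the
 * current fence of every syncobj before the VA operation proceeds. A zero
 * handle in the array is rejected with -EINVAL.
 */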
48 static int
49 amdgpu_gem_add_input_fence(struct drm_file *filp,
50 			   uint64_t syncobj_handles_array,
51 			   uint32_t num_syncobj_handles)
52 {
53 	struct dma_fence *fence;
54 	uint32_t *syncobj_handles;
55 	int ret, i;
56 
57 	if (!num_syncobj_handles)
58 		return 0;
59 
60 	syncobj_handles = memdup_user(u64_to_user_ptr(syncobj_handles_array),
61 				      size_mul(sizeof(uint32_t), num_syncobj_handles));
62 	if (IS_ERR(syncobj_handles))
63 		return PTR_ERR(syncobj_handles);
64 
65 	for (i = 0; i < num_syncobj_handles; i++) {
66 
67 		if (!syncobj_handles[i]) {
68 			ret = -EINVAL;
69 			goto free_memdup;
70 		}
71 
72 		ret = drm_syncobj_find_fence(filp, syncobj_handles[i], 0, 0, &fence);
73 		if (ret)
74 			goto free_memdup;
75 
76 		dma_fence_wait(fence, false);
77 
78 		/* TODO: optimize async handling */
79 		dma_fence_put(fence);
80 	}
81 
82 free_memdup:
83 	kfree(syncobj_handles);
84 	return ret;
85 }
86 
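/**
 * amdgpu_gem_update_timeline_node - look up the VM timeline syncobj
 *
 * @filp: drm file pointer
 * @syncobj_handle: handle of the syncobj to signal, 0 to disable
 * @point: timeline point, 0 for a binary syncobj
 * @syncobj: returned syncobj reference
 * @chain: returned preallocated dma_fence_chain node
 *
 * Resolves the syncobj handle and, when a timeline point is requested,
 * preallocates the fence chain node that amdgpu_gem_update_bo_mapping()
 * later adds to the timeline.
 */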
87 static int
88 amdgpu_gem_update_timeline_node(struct drm_file *filp,
89 				uint32_t syncobj_handle,
90 				uint64_t point,
91 				struct drm_syncobj **syncobj,
92 				struct dma_fence_chain **chain)
93 {
94 	if (!syncobj_handle)
95 		return 0;
96 
97 	/* Find the sync object */
98 	*syncobj = drm_syncobj_find(filp, syncobj_handle);
99 	if (!*syncobj)
100 		return -ENOENT;
101 
102 	if (!point)
103 		return 0;
104 
105 	/* Allocate the chain node */
106 	*chain = dma_fence_chain_alloc();
107 	if (!*chain) {
108 		drm_syncobj_put(*syncobj);
109 		return -ENOMEM;
110 	}
111 
112 	return 0;
113 }
114 
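/**
 * amdgpu_gem_update_bo_mapping - signal the VM timeline for a VA operation
 *
 * @filp: drm file pointer
 * @bo_va: bo_va the operation was applied to, NULL for a clear operation
 * @operation: AMDGPU_VA_OP_* that was performed
 * @point: timeline point to signal, 0 to replace the fence of a binary syncobj
 * @fence: fence returned by amdgpu_gem_va_update_vm()
 * @syncobj: syncobj to signal, may be NULL
 * @chain: preallocated chain node used when adding a timeline point
 *
 * Picks the fence that marks completion of the VA operation (the last VM or
 * bo_va page table update for map/replace, the clear-freed fence for
 * unmap/clear) and attaches it to the user-provided syncobj.
 */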
115 static void
116 amdgpu_gem_update_bo_mapping(struct drm_file *filp,
117 			     struct amdgpu_bo_va *bo_va,
118 			     uint32_t operation,
119 			     uint64_t point,
120 			     struct dma_fence *fence,
121 			     struct drm_syncobj *syncobj,
122 			     struct dma_fence_chain *chain)
123 {
124 	struct amdgpu_bo *bo = bo_va ? bo_va->base.bo : NULL;
125 	struct amdgpu_fpriv *fpriv = filp->driver_priv;
126 	struct amdgpu_vm *vm = &fpriv->vm;
127 	struct dma_fence *last_update;
128 
129 	if (!syncobj)
130 		return;
131 
132 	/* Find the last update fence */
133 	switch (operation) {
134 	case AMDGPU_VA_OP_MAP:
135 	case AMDGPU_VA_OP_REPLACE:
136 		if (bo && (bo->tbo.base.resv == vm->root.bo->tbo.base.resv))
137 			last_update = vm->last_update;
138 		else
139 			last_update = bo_va->last_pt_update;
140 		break;
141 	case AMDGPU_VA_OP_UNMAP:
142 	case AMDGPU_VA_OP_CLEAR:
143 		last_update = fence;
144 		break;
145 	default:
146 		return;
147 	}
148 
149 	/* Add fence to timeline */
150 	if (!point)
151 		drm_syncobj_replace_fence(syncobj, last_update);
152 	else
153 		drm_syncobj_add_point(syncobj, chain, last_update, point);
154 }
155 
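/**
 * amdgpu_gem_fault - CPU page fault handler for amdgpu BOs
 *
 * @vmf: fault information
 *
 * Reserves the BO, gives the driver a chance to move the buffer via
 * amdgpu_bo_fault_reserve_notify() and then lets TTM insert the PTEs with
 * TTM_BO_VM_NUM_PREFAULT pages prefaulted. If the device has been unplugged
 * a dummy page is mapped instead.
 */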
156 static vm_fault_t amdgpu_gem_fault(struct vm_fault *vmf)
157 {
158 	struct ttm_buffer_object *bo = vmf->vma->vm_private_data;
159 	struct drm_device *ddev = bo->base.dev;
160 	vm_fault_t ret;
161 	int idx;
162 
163 	ret = ttm_bo_vm_reserve(bo, vmf);
164 	if (ret)
165 		return ret;
166 
167 	if (drm_dev_enter(ddev, &idx)) {
168 		ret = amdgpu_bo_fault_reserve_notify(bo);
169 		if (ret) {
170 			drm_dev_exit(idx);
171 			goto unlock;
172 		}
173 
174 		ret = ttm_bo_vm_fault_reserved(vmf, vmf->vma->vm_page_prot,
175 					       TTM_BO_VM_NUM_PREFAULT);
176 
177 		drm_dev_exit(idx);
178 	} else {
179 		ret = ttm_bo_vm_dummy_page(vmf, vmf->vma->vm_page_prot);
180 	}
181 	if (ret == VM_FAULT_RETRY && !(vmf->flags & FAULT_FLAG_RETRY_NOWAIT))
182 		return ret;
183 
184 unlock:
185 	dma_resv_unlock(bo->base.resv);
186 	return ret;
187 }
188 
189 static const struct vm_operations_struct amdgpu_gem_vm_ops = {
190 	.fault = amdgpu_gem_fault,
191 	.open = ttm_bo_vm_open,
192 	.close = ttm_bo_vm_close,
193 	.access = ttm_bo_vm_access
194 };
195 
196 static void amdgpu_gem_object_free(struct drm_gem_object *gobj)
197 {
198 	struct amdgpu_bo *aobj = gem_to_amdgpu_bo(gobj);
199 
200 	amdgpu_hmm_unregister(aobj);
201 	ttm_bo_fini(&aobj->tbo);
202 }
203 
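/**
 * amdgpu_gem_object_create - allocate a GEM object backed by an amdgpu BO
 *
 * @adev: amdgpu device
 * @size: size of the BO in bytes
 * @alignment: byte alignment of the BO
 * @initial_domain: initial placement domain(s)
 * @flags: AMDGPU_GEM_CREATE_* flags
 * @type: TTM BO type
 * @resv: optional reservation object to share, NULL to allocate a new one
 * @obj: returned GEM object
 * @xcp_id_plus1: XCP partition id plus one, copied into the BO parameters
 *
 * Creates an amdgpu_bo_user and returns the embedded GEM object. VRAM
 * buffers created here are always wiped on release.
 */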
204 int amdgpu_gem_object_create(struct amdgpu_device *adev, unsigned long size,
205 			     int alignment, u32 initial_domain,
206 			     u64 flags, enum ttm_bo_type type,
207 			     struct dma_resv *resv,
208 			     struct drm_gem_object **obj, int8_t xcp_id_plus1)
209 {
210 	struct amdgpu_bo *bo;
211 	struct amdgpu_bo_user *ubo;
212 	struct amdgpu_bo_param bp;
213 	int r;
214 
215 	memset(&bp, 0, sizeof(bp));
216 	*obj = NULL;
217 	flags |= AMDGPU_GEM_CREATE_VRAM_WIPE_ON_RELEASE;
218 
219 	bp.size = size;
220 	bp.byte_align = alignment;
221 	bp.type = type;
222 	bp.resv = resv;
223 	bp.preferred_domain = initial_domain;
224 	bp.flags = flags;
225 	bp.domain = initial_domain;
226 	bp.bo_ptr_size = sizeof(struct amdgpu_bo);
227 	bp.xcp_id_plus1 = xcp_id_plus1;
228 
229 	r = amdgpu_bo_create_user(adev, &bp, &ubo);
230 	if (r)
231 		return r;
232 
233 	bo = &ubo->bo;
234 	*obj = &bo->tbo.base;
235 
236 	return 0;
237 }
238 
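/**
 * amdgpu_gem_force_release - drop all GEM handles of all clients
 *
 * @adev: amdgpu device
 *
 * Walks every open DRM file and releases every GEM object still referenced
 * by its handle table. Only expected to run while user space clients are
 * still active during teardown, hence the warnings.
 */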
239 void amdgpu_gem_force_release(struct amdgpu_device *adev)
240 {
241 	struct drm_device *ddev = adev_to_drm(adev);
242 	struct drm_file *file;
243 
244 	mutex_lock(&ddev->filelist_mutex);
245 
246 	list_for_each_entry(file, &ddev->filelist, lhead) {
247 		struct drm_gem_object *gobj;
248 		int handle;
249 
250 		WARN_ONCE(1, "Still active user space clients!\n");
251 		spin_lock(&file->table_lock);
252 		idr_for_each_entry(&file->object_idr, gobj, handle) {
253 			WARN_ONCE(1, "And also active allocations!\n");
254 			drm_gem_object_put(gobj);
255 		}
256 		idr_destroy(&file->object_idr);
257 		spin_unlock(&file->table_lock);
258 	}
259 
260 	mutex_unlock(&ddev->filelist_mutex);
261 }
262 
263 /*
264  * Called from drm_gem_handle_create, which is used in both the create and
265  * open ioctl cases.
266  */
267 static int amdgpu_gem_object_open(struct drm_gem_object *obj,
268 				  struct drm_file *file_priv)
269 {
270 	struct amdgpu_bo *abo = gem_to_amdgpu_bo(obj);
271 	struct amdgpu_device *adev = amdgpu_ttm_adev(abo->tbo.bdev);
272 	struct amdgpu_fpriv *fpriv = file_priv->driver_priv;
273 	struct amdgpu_vm *vm = &fpriv->vm;
274 	struct amdgpu_bo_va *bo_va;
275 	struct mm_struct *mm;
276 	int r;
277 
278 	mm = amdgpu_ttm_tt_get_usermm(abo->tbo.ttm);
279 	if (mm && mm != current->mm)
280 		return -EPERM;
281 
282 	if (abo->flags & AMDGPU_GEM_CREATE_VM_ALWAYS_VALID &&
283 	    !amdgpu_vm_is_bo_always_valid(vm, abo))
284 		return -EPERM;
285 
286 	r = amdgpu_bo_reserve(abo, false);
287 	if (r)
288 		return r;
289 
290 	amdgpu_vm_bo_update_shared(abo);
291 	bo_va = amdgpu_vm_bo_find(vm, abo);
292 	if (!bo_va)
293 		bo_va = amdgpu_vm_bo_add(adev, vm, abo);
294 	else
295 		++bo_va->ref_count;
296 
297 	/* attach gfx eviction fence */
298 	r = amdgpu_eviction_fence_attach(&fpriv->evf_mgr, abo);
299 	if (r) {
300 		DRM_DEBUG_DRIVER("Failed to attach eviction fence to BO\n");
301 		amdgpu_bo_unreserve(abo);
302 		return r;
303 	}
304 
305 	amdgpu_bo_unreserve(abo);
306 
307 	/* Validate and add eviction fence to DMABuf imports with dynamic
308 	 * attachment in compute VMs. Re-validation will be done by
309 	 * amdgpu_vm_validate. Fences are on the reservation shared with the
310 	 * export, which is currently required to be validated and fenced
311 	 * already by amdgpu_amdkfd_gpuvm_restore_process_bos.
312 	 *
313 	 * Nested locking below for the case that a GEM object is opened in
314 	 * kfd_mem_export_dmabuf. Since the lock below is only taken for imports,
315 	 * but not for export, this is a different lock class that cannot lead to
316 	 * circular lock dependencies.
317 	 */
318 	if (!vm->is_compute_context || !vm->process_info)
319 		return 0;
320 	if (!drm_gem_is_imported(obj) ||
321 	    !dma_buf_is_dynamic(obj->import_attach->dmabuf))
322 		return 0;
323 	mutex_lock_nested(&vm->process_info->lock, 1);
324 	if (!WARN_ON(!vm->process_info->eviction_fence)) {
325 		r = amdgpu_amdkfd_bo_validate_and_fence(abo, AMDGPU_GEM_DOMAIN_GTT,
326 							&vm->process_info->eviction_fence->base);
327 		if (r) {
328 			struct amdgpu_task_info *ti = amdgpu_vm_get_task_info_vm(vm);
329 
330 			dev_warn(adev->dev, "validate_and_fence failed: %d\n", r);
331 			if (ti) {
332 				dev_warn(adev->dev, "pid %d\n", ti->task.pid);
333 				amdgpu_vm_put_task_info(ti);
334 			}
335 		}
336 	}
337 	mutex_unlock(&vm->process_info->lock);
338 
339 	return r;
340 }
341 
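/**
 * amdgpu_gem_object_close - clean up per-VM state when a handle is closed
 *
 * @obj: GEM object being closed
 * @file_priv: drm file the handle belonged to
 *
 * Detaches the gfx eviction fence for BOs that are not always valid in the
 * VM, drops a reference on the bo_va and, when it was the last one, removes
 * the bo_va, clears the freed mappings from the page tables and fences the
 * BO with the resulting page table update.
 */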
342 static void amdgpu_gem_object_close(struct drm_gem_object *obj,
343 				    struct drm_file *file_priv)
344 {
345 	struct amdgpu_bo *bo = gem_to_amdgpu_bo(obj);
346 	struct amdgpu_device *adev = amdgpu_ttm_adev(bo->tbo.bdev);
347 	struct amdgpu_fpriv *fpriv = file_priv->driver_priv;
348 	struct amdgpu_vm *vm = &fpriv->vm;
349 
350 	struct dma_fence *fence = NULL;
351 	struct amdgpu_bo_va *bo_va;
352 	struct drm_exec exec;
353 	long r;
354 
355 	drm_exec_init(&exec, DRM_EXEC_IGNORE_DUPLICATES, 0);
356 	drm_exec_until_all_locked(&exec) {
357 		r = drm_exec_prepare_obj(&exec, &bo->tbo.base, 1);
358 		drm_exec_retry_on_contention(&exec);
359 		if (unlikely(r))
360 			goto out_unlock;
361 
362 		r = amdgpu_vm_lock_pd(vm, &exec, 0);
363 		drm_exec_retry_on_contention(&exec);
364 		if (unlikely(r))
365 			goto out_unlock;
366 	}
367 
368 	if (!amdgpu_vm_is_bo_always_valid(vm, bo))
369 		amdgpu_eviction_fence_detach(&fpriv->evf_mgr, bo);
370 
371 	bo_va = amdgpu_vm_bo_find(vm, bo);
372 	if (!bo_va || --bo_va->ref_count)
373 		goto out_unlock;
374 
375 	amdgpu_vm_bo_del(adev, bo_va);
376 	amdgpu_vm_bo_update_shared(bo);
377 	if (!amdgpu_vm_ready(vm))
378 		goto out_unlock;
379 
380 	r = amdgpu_vm_clear_freed(adev, vm, &fence);
381 	if (unlikely(r < 0))
382 		dev_err(adev->dev,
383 			"failed to clear page tables on GEM object close (%ld)\n", r);
384 	if (r || !fence)
385 		goto out_unlock;
386 
387 	amdgpu_bo_fence(bo, fence, true);
388 	dma_fence_put(fence);
389 
390 out_unlock:
391 	if (r)
392 		dev_err(adev->dev, "leaking bo va (%ld)\n", r);
393 	drm_exec_fini(&exec);
394 }
395 
396 static int amdgpu_gem_object_mmap(struct drm_gem_object *obj, struct vm_area_struct *vma)
397 {
398 	struct amdgpu_bo *bo = gem_to_amdgpu_bo(obj);
399 
400 	if (amdgpu_ttm_tt_get_usermm(bo->tbo.ttm))
401 		return -EPERM;
402 	if (bo->flags & AMDGPU_GEM_CREATE_NO_CPU_ACCESS)
403 		return -EPERM;
404 
405 	/* Workaround for Thunk bug creating PROT_NONE,MAP_PRIVATE mappings
406 	 * for debugger access to invisible VRAM. Should have used MAP_SHARED
407 	 * instead. Clearing VM_MAYWRITE prevents the mapping from ever
408 	 * becoming writable and makes is_cow_mapping(vm_flags) false.
409 	 */
410 	if (is_cow_mapping(vma->vm_flags) &&
411 	    !(vma->vm_flags & VM_ACCESS_FLAGS))
412 		vm_flags_clear(vma, VM_MAYWRITE);
413 
414 	return drm_gem_ttm_mmap(obj, vma);
415 }
416 
417 const struct drm_gem_object_funcs amdgpu_gem_object_funcs = {
418 	.free = amdgpu_gem_object_free,
419 	.open = amdgpu_gem_object_open,
420 	.close = amdgpu_gem_object_close,
421 	.export = amdgpu_gem_prime_export,
422 	.vmap = drm_gem_ttm_vmap,
423 	.vunmap = drm_gem_ttm_vunmap,
424 	.mmap = amdgpu_gem_object_mmap,
425 	.vm_ops = &amdgpu_gem_vm_ops,
426 };
427 
428 /*
429  * GEM ioctls.
430  */
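/**
 * amdgpu_gem_create_ioctl - create a GEM object
 *
 * @dev: drm device pointer
 * @data: union drm_amdgpu_gem_create in/out arguments
 * @filp: drm file pointer
 *
 * Validates the requested flags and domains, creates the BO (sharing the
 * root PD reservation for per-VM always-valid BOs) and returns a GEM handle.
 * On allocation failure the CPU_ACCESS_REQUIRED flag is dropped and a pure
 * VRAM placement falls back to VRAM|GTT before giving up.
 */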
431 int amdgpu_gem_create_ioctl(struct drm_device *dev, void *data,
432 			    struct drm_file *filp)
433 {
434 	struct amdgpu_device *adev = drm_to_adev(dev);
435 	struct amdgpu_fpriv *fpriv = filp->driver_priv;
436 	struct amdgpu_vm *vm = &fpriv->vm;
437 	union drm_amdgpu_gem_create *args = data;
438 	uint64_t flags = args->in.domain_flags;
439 	uint64_t size = args->in.bo_size;
440 	struct dma_resv *resv = NULL;
441 	struct drm_gem_object *gobj;
442 	uint32_t handle, initial_domain;
443 	int r;
444 
445 	/* reject invalid gem flags */
446 	if (flags & ~AMDGPU_GEM_CREATE_SETTABLE_MASK)
447 		return -EINVAL;
448 
449 	/* reject invalid gem domains */
450 	if (args->in.domains & ~AMDGPU_GEM_DOMAIN_MASK)
451 		return -EINVAL;
452 
453 	if (!amdgpu_is_tmz(adev) && (flags & AMDGPU_GEM_CREATE_ENCRYPTED)) {
454 		DRM_NOTE_ONCE("Cannot allocate secure buffer since TMZ is disabled\n");
455 		return -EINVAL;
456 	}
457 
458 	/* always clear VRAM */
459 	flags |= AMDGPU_GEM_CREATE_VRAM_CLEARED;
460 
461 	if (args->in.domains & AMDGPU_GEM_DOMAIN_MMIO_REMAP)
462 		return -EINVAL;
463 
464 	/* create a GEM object to contain this buffer */
465 	if (args->in.domains & (AMDGPU_GEM_DOMAIN_GDS |
466 	    AMDGPU_GEM_DOMAIN_GWS | AMDGPU_GEM_DOMAIN_OA)) {
467 		if (flags & AMDGPU_GEM_CREATE_VM_ALWAYS_VALID) {
468 			/* if a GDS BO is created from user space, it must be
469 			 * passed to the BO list
470 			 */
471 			DRM_ERROR("GDS bo cannot be per-vm-bo\n");
472 			return -EINVAL;
473 		}
474 		flags |= AMDGPU_GEM_CREATE_NO_CPU_ACCESS;
475 	}
476 
477 	if (flags & AMDGPU_GEM_CREATE_VM_ALWAYS_VALID) {
478 		r = amdgpu_bo_reserve(vm->root.bo, false);
479 		if (r)
480 			return r;
481 
482 		resv = vm->root.bo->tbo.base.resv;
483 	}
484 
485 	initial_domain = (u32)(0xffffffff & args->in.domains);
486 retry:
487 	r = amdgpu_gem_object_create(adev, size, args->in.alignment,
488 				     initial_domain,
489 				     flags, ttm_bo_type_device, resv, &gobj, fpriv->xcp_id + 1);
490 	if (r && r != -ERESTARTSYS) {
491 		if (flags & AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED) {
492 			flags &= ~AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED;
493 			goto retry;
494 		}
495 
496 		if (initial_domain == AMDGPU_GEM_DOMAIN_VRAM) {
497 			initial_domain |= AMDGPU_GEM_DOMAIN_GTT;
498 			goto retry;
499 		}
500 		DRM_DEBUG("Failed to allocate GEM object (%llu, %d, %llu, %d)\n",
501 				size, initial_domain, args->in.alignment, r);
502 	}
503 
504 	if (flags & AMDGPU_GEM_CREATE_VM_ALWAYS_VALID) {
505 		if (!r) {
506 			struct amdgpu_bo *abo = gem_to_amdgpu_bo(gobj);
507 
508 			abo->parent = amdgpu_bo_ref(vm->root.bo);
509 		}
510 		amdgpu_bo_unreserve(vm->root.bo);
511 	}
512 	if (r)
513 		return r;
514 
515 	r = drm_gem_handle_create(filp, gobj, &handle);
516 	/* drop reference from allocate - handle holds it now */
517 	drm_gem_object_put(gobj);
518 	if (r)
519 		return r;
520 
521 	memset(args, 0, sizeof(*args));
522 	args->out.handle = handle;
523 	return 0;
524 }
525 
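/**
 * amdgpu_gem_userptr_ioctl - create a GEM object backed by user memory
 *
 * @dev: drm device pointer
 * @data: struct drm_amdgpu_gem_userptr in/out arguments
 * @filp: drm file pointer
 *
 * Creates a GTT BO whose pages come from the supplied user address range,
 * registers an HMM notifier for it and, when AMDGPU_GEM_USERPTR_VALIDATE is
 * set, faults in and validates the user pages up front.
 */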
526 int amdgpu_gem_userptr_ioctl(struct drm_device *dev, void *data,
527 			     struct drm_file *filp)
528 {
529 	struct ttm_operation_ctx ctx = { true, false };
530 	struct amdgpu_device *adev = drm_to_adev(dev);
531 	struct drm_amdgpu_gem_userptr *args = data;
532 	struct amdgpu_fpriv *fpriv = filp->driver_priv;
533 	struct drm_gem_object *gobj;
534 	struct amdgpu_hmm_range *range;
535 	struct amdgpu_bo *bo;
536 	uint32_t handle;
537 	int r;
538 
539 	args->addr = untagged_addr(args->addr);
540 
541 	if (offset_in_page(args->addr | args->size))
542 		return -EINVAL;
543 
544 	/* reject unknown flag values */
545 	if (args->flags & ~(AMDGPU_GEM_USERPTR_READONLY |
546 	    AMDGPU_GEM_USERPTR_ANONONLY | AMDGPU_GEM_USERPTR_VALIDATE |
547 	    AMDGPU_GEM_USERPTR_REGISTER))
548 		return -EINVAL;
549 
550 	if (!(args->flags & AMDGPU_GEM_USERPTR_READONLY) &&
551 	     !(args->flags & AMDGPU_GEM_USERPTR_REGISTER)) {
552 
553 		/* if we want to write to it we must install an MMU notifier */
554 		return -EACCES;
555 	}
556 
557 	/* create a GEM object to contain this buffer */
558 	r = amdgpu_gem_object_create(adev, args->size, 0, AMDGPU_GEM_DOMAIN_CPU,
559 				     0, ttm_bo_type_device, NULL, &gobj, fpriv->xcp_id + 1);
560 	if (r)
561 		return r;
562 
563 	bo = gem_to_amdgpu_bo(gobj);
564 	bo->preferred_domains = AMDGPU_GEM_DOMAIN_GTT;
565 	bo->allowed_domains = AMDGPU_GEM_DOMAIN_GTT;
566 	r = amdgpu_ttm_tt_set_userptr(&bo->tbo, args->addr, args->flags);
567 	if (r)
568 		goto release_object;
569 
570 	r = amdgpu_hmm_register(bo, args->addr);
571 	if (r)
572 		goto release_object;
573 
574 	if (args->flags & AMDGPU_GEM_USERPTR_VALIDATE) {
575 		range = amdgpu_hmm_range_alloc(NULL);
576 		if (unlikely(!range)) {
577 			r = -ENOMEM;
			goto release_object;
		}
578 		r = amdgpu_ttm_tt_get_user_pages(bo, range);
579 		if (r) {
580 			amdgpu_hmm_range_free(range);
581 			goto release_object;
582 		}
583 		r = amdgpu_bo_reserve(bo, true);
584 		if (r)
585 			goto user_pages_done;
586 
587 		amdgpu_ttm_tt_set_user_pages(bo->tbo.ttm, range);
588 
589 		amdgpu_bo_placement_from_domain(bo, AMDGPU_GEM_DOMAIN_GTT);
590 		r = ttm_bo_validate(&bo->tbo, &bo->placement, &ctx);
591 		amdgpu_bo_unreserve(bo);
592 		if (r)
593 			goto user_pages_done;
594 	}
595 
596 	r = drm_gem_handle_create(filp, gobj, &handle);
597 	if (r)
598 		goto user_pages_done;
599 
600 	args->handle = handle;
601 
602 user_pages_done:
603 	if (args->flags & AMDGPU_GEM_USERPTR_VALIDATE)
604 		amdgpu_hmm_range_free(range);
605 release_object:
606 	drm_gem_object_put(gobj);
607 
608 	return r;
609 }
610 
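/**
 * amdgpu_mode_dumb_mmap - return the fake mmap offset for a BO
 *
 * @filp: drm file pointer
 * @dev: drm device pointer
 * @handle: GEM handle of the BO
 * @offset_p: returned mmap offset
 *
 * Looks up the GEM object and reports the offset to pass to mmap(). Userptr
 * BOs and BOs created with AMDGPU_GEM_CREATE_NO_CPU_ACCESS are rejected.
 */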
611 int amdgpu_mode_dumb_mmap(struct drm_file *filp,
612 			  struct drm_device *dev,
613 			  uint32_t handle, uint64_t *offset_p)
614 {
615 	struct drm_gem_object *gobj;
616 	struct amdgpu_bo *robj;
617 
618 	gobj = drm_gem_object_lookup(filp, handle);
619 	if (!gobj)
620 		return -ENOENT;
621 
622 	robj = gem_to_amdgpu_bo(gobj);
623 	if (amdgpu_ttm_tt_get_usermm(robj->tbo.ttm) ||
624 	    (robj->flags & AMDGPU_GEM_CREATE_NO_CPU_ACCESS)) {
625 		drm_gem_object_put(gobj);
626 		return -EPERM;
627 	}
628 	*offset_p = amdgpu_bo_mmap_offset(robj);
629 	drm_gem_object_put(gobj);
630 	return 0;
631 }
632 
633 int amdgpu_gem_mmap_ioctl(struct drm_device *dev, void *data,
634 			  struct drm_file *filp)
635 {
636 	union drm_amdgpu_gem_mmap *args = data;
637 	uint32_t handle = args->in.handle;
638 
639 	memset(args, 0, sizeof(*args));
640 	return amdgpu_mode_dumb_mmap(filp, dev, handle, &args->out.addr_ptr);
641 }
642 
643 /**
644  * amdgpu_gem_timeout - calculate jiffies timeout from absolute value
645  *
646  * @timeout_ns: timeout in ns
647  *
648  * Calculate the timeout in jiffies from an absolute timeout in ns.
649  */
650 unsigned long amdgpu_gem_timeout(uint64_t timeout_ns)
651 {
652 	unsigned long timeout_jiffies;
653 	ktime_t timeout;
654 
655 	/* clamp timeout if it's too large */
656 	if (((int64_t)timeout_ns) < 0)
657 		return MAX_SCHEDULE_TIMEOUT;
658 
659 	timeout = ktime_sub(ns_to_ktime(timeout_ns), ktime_get());
660 	if (ktime_to_ns(timeout) < 0)
661 		return 0;
662 
663 	timeout_jiffies = nsecs_to_jiffies(ktime_to_ns(timeout));
664 	/* clamp timeout to avoid unsigned -> signed overflow */
665 	if (timeout_jiffies > MAX_SCHEDULE_TIMEOUT)
666 		return MAX_SCHEDULE_TIMEOUT - 1;
667 
668 	return timeout_jiffies;
669 }
670 
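/**
 * amdgpu_gem_wait_idle_ioctl - wait for a BO to become idle
 *
 * @dev: drm device pointer
 * @data: union drm_amdgpu_gem_wait_idle in/out arguments
 * @filp: drm file pointer
 *
 * Waits on all fences in the BO's reservation object (DMA_RESV_USAGE_READ)
 * up to the relative timeout derived from the absolute timeout in the
 * arguments and reports whether the BO is still busy after the wait.
 */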
671 int amdgpu_gem_wait_idle_ioctl(struct drm_device *dev, void *data,
672 			      struct drm_file *filp)
673 {
674 	union drm_amdgpu_gem_wait_idle *args = data;
675 	struct drm_gem_object *gobj;
676 	struct amdgpu_bo *robj;
677 	uint32_t handle = args->in.handle;
678 	unsigned long timeout = amdgpu_gem_timeout(args->in.timeout);
679 	int r = 0;
680 	long ret;
681 
682 	gobj = drm_gem_object_lookup(filp, handle);
683 	if (!gobj)
684 		return -ENOENT;
685 
686 	robj = gem_to_amdgpu_bo(gobj);
687 	ret = dma_resv_wait_timeout(robj->tbo.base.resv, DMA_RESV_USAGE_READ,
688 				    true, timeout);
689 
690 	/* ret == 0 means not signaled,
691 	 * ret > 0 means signaled,
692 	 * ret < 0 means interrupted before timeout
693 	 */
694 	if (ret >= 0) {
695 		memset(args, 0, sizeof(*args));
696 		args->out.status = (ret == 0);
697 	} else
698 		r = ret;
699 
700 	drm_gem_object_put(gobj);
701 	return r;
702 }
703 
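/**
 * amdgpu_gem_metadata_ioctl - get or set tiling flags and opaque metadata
 *
 * @dev: drm device pointer
 * @data: struct drm_amdgpu_gem_metadata in/out arguments
 * @filp: drm file pointer
 *
 * Reads or updates the tiling flags and the opaque metadata blob attached to
 * a BO. MMIO_REMAP BOs are rejected since metadata does not apply to them.
 */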
704 int amdgpu_gem_metadata_ioctl(struct drm_device *dev, void *data,
705 				struct drm_file *filp)
706 {
707 	struct drm_amdgpu_gem_metadata *args = data;
708 	struct drm_gem_object *gobj;
709 	struct amdgpu_bo *robj;
710 	int r = -1;
711 
712 	DRM_DEBUG("%d\n", args->handle);
713 	gobj = drm_gem_object_lookup(filp, args->handle);
714 	if (gobj == NULL)
715 		return -ENOENT;
716 	robj = gem_to_amdgpu_bo(gobj);
717 
718 	r = amdgpu_bo_reserve(robj, false);
719 	if (unlikely(r != 0))
720 		goto out;
721 
722 	/* Reject MMIO_REMAP BOs at IOCTL level: metadata/tiling does not apply. */
723 	if (robj->tbo.resource &&
724 	    robj->tbo.resource->mem_type == AMDGPU_PL_MMIO_REMAP) {
725 		DRM_WARN("metadata ioctl on MMIO_REMAP BO (handle %d)\n",
726 			 args->handle);
727 		r = -EINVAL;
728 		goto unreserve;
729 	}
730 
731 	if (args->op == AMDGPU_GEM_METADATA_OP_GET_METADATA) {
732 		amdgpu_bo_get_tiling_flags(robj, &args->data.tiling_info);
733 		r = amdgpu_bo_get_metadata(robj, args->data.data,
734 					   sizeof(args->data.data),
735 					   &args->data.data_size_bytes,
736 					   &args->data.flags);
737 	} else if (args->op == AMDGPU_GEM_METADATA_OP_SET_METADATA) {
738 		if (args->data.data_size_bytes > sizeof(args->data.data)) {
739 			r = -EINVAL;
740 			goto unreserve;
741 		}
742 		r = amdgpu_bo_set_tiling_flags(robj, args->data.tiling_info);
743 		if (!r)
744 			r = amdgpu_bo_set_metadata(robj, args->data.data,
745 						   args->data.data_size_bytes,
746 						   args->data.flags);
747 	}
748 
749 unreserve:
750 	amdgpu_bo_unreserve(robj);
751 out:
752 	drm_gem_object_put(gobj);
753 	return r;
754 }
755 
756 /**
757  * amdgpu_gem_va_update_vm - update the bo_va in its VM
758  *
759  * @adev: amdgpu_device pointer
760  * @vm: vm to update
761  * @bo_va: bo_va to update
762  * @operation: map, unmap or clear
763  *
764  * Update the bo_va directly after setting its address. Errors are not
765  * vital here, so they are not reported back to userspace.
766  *
767  * Returns the resulting fence if freed BO(s) were cleared from the PT,
768  * otherwise a stub fence in case of error.
769  */
770 static struct dma_fence *
771 amdgpu_gem_va_update_vm(struct amdgpu_device *adev,
772 			struct amdgpu_vm *vm,
773 			struct amdgpu_bo_va *bo_va,
774 			uint32_t operation)
775 {
776 	struct dma_fence *fence = dma_fence_get_stub();
777 	int r;
778 
779 	if (!amdgpu_vm_ready(vm))
780 		return fence;
781 
782 	r = amdgpu_vm_clear_freed(adev, vm, &fence);
783 	if (r)
784 		goto error;
785 
786 	if (operation == AMDGPU_VA_OP_MAP ||
787 	    operation == AMDGPU_VA_OP_REPLACE) {
788 		r = amdgpu_vm_bo_update(adev, bo_va, false);
789 		if (r)
790 			goto error;
791 	}
792 
793 	r = amdgpu_vm_update_pdes(adev, vm, false);
794 
795 error:
796 	if (r && r != -ERESTARTSYS)
797 		DRM_ERROR("Couldn't update BO_VA (%d)\n", r);
798 
799 	return fence;
800 }
801 
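/**
 * amdgpu_gem_va_ioctl - manage GPU virtual address mappings
 *
 * @dev: drm device pointer
 * @data: struct drm_amdgpu_gem_va in/out arguments
 * @filp: drm file pointer
 *
 * Maps, unmaps, replaces or clears a VA range for a BO (or for the PRT VA
 * when no BO is given). Optionally waits for user-supplied input fences
 * first and signals a VM timeline syncobj once the page table update that
 * belongs to the operation has been scheduled.
 */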
802 int amdgpu_gem_va_ioctl(struct drm_device *dev, void *data,
803 			  struct drm_file *filp)
804 {
805 	const uint32_t valid_flags = AMDGPU_VM_DELAY_UPDATE |
806 		AMDGPU_VM_PAGE_READABLE | AMDGPU_VM_PAGE_WRITEABLE |
807 		AMDGPU_VM_PAGE_EXECUTABLE | AMDGPU_VM_MTYPE_MASK |
808 		AMDGPU_VM_PAGE_NOALLOC;
809 	const uint32_t prt_flags = AMDGPU_VM_DELAY_UPDATE |
810 		AMDGPU_VM_PAGE_PRT;
811 
812 	struct drm_amdgpu_gem_va *args = data;
813 	struct drm_gem_object *gobj;
814 	struct amdgpu_device *adev = drm_to_adev(dev);
815 	struct amdgpu_fpriv *fpriv = filp->driver_priv;
816 	struct amdgpu_bo *abo;
817 	struct amdgpu_bo_va *bo_va;
818 	struct drm_syncobj *timeline_syncobj = NULL;
819 	struct dma_fence_chain *timeline_chain = NULL;
820 	struct dma_fence *fence;
821 	struct drm_exec exec;
822 	uint64_t vm_size;
823 	int r = 0;
824 
825 	if (args->va_address < AMDGPU_VA_RESERVED_BOTTOM) {
826 		dev_dbg(dev->dev,
827 			"va_address 0x%llx is in reserved area 0x%llx\n",
828 			args->va_address, AMDGPU_VA_RESERVED_BOTTOM);
829 		return -EINVAL;
830 	}
831 
832 	if (args->va_address >= AMDGPU_GMC_HOLE_START &&
833 	    args->va_address < AMDGPU_GMC_HOLE_END) {
834 		dev_dbg(dev->dev,
835 			"va_address 0x%llx is in VA hole 0x%llx-0x%llx\n",
836 			args->va_address, AMDGPU_GMC_HOLE_START,
837 			AMDGPU_GMC_HOLE_END);
838 		return -EINVAL;
839 	}
840 
841 	args->va_address &= AMDGPU_GMC_HOLE_MASK;
842 
843 	vm_size = adev->vm_manager.max_pfn * AMDGPU_GPU_PAGE_SIZE;
844 	vm_size -= AMDGPU_VA_RESERVED_TOP;
845 	if (args->va_address + args->map_size > vm_size) {
846 		dev_dbg(dev->dev,
847 			"va_address 0x%llx is in top reserved area 0x%llx\n",
848 			args->va_address + args->map_size, vm_size);
849 		return -EINVAL;
850 	}
851 
852 	if ((args->flags & ~valid_flags) && (args->flags & ~prt_flags)) {
853 		dev_dbg(dev->dev, "invalid flags combination 0x%08X\n",
854 			args->flags);
855 		return -EINVAL;
856 	}
857 
858 	switch (args->operation) {
859 	case AMDGPU_VA_OP_MAP:
860 	case AMDGPU_VA_OP_UNMAP:
861 	case AMDGPU_VA_OP_CLEAR:
862 	case AMDGPU_VA_OP_REPLACE:
863 		break;
864 	default:
865 		dev_dbg(dev->dev, "unsupported operation %d\n",
866 			args->operation);
867 		return -EINVAL;
868 	}
869 
870 	if ((args->operation != AMDGPU_VA_OP_CLEAR) &&
871 	    !(args->flags & AMDGPU_VM_PAGE_PRT)) {
872 		gobj = drm_gem_object_lookup(filp, args->handle);
873 		if (gobj == NULL)
874 			return -ENOENT;
875 		abo = gem_to_amdgpu_bo(gobj);
876 	} else {
877 		gobj = NULL;
878 		abo = NULL;
879 	}
880 
881 	r = amdgpu_gem_add_input_fence(filp,
882 				       args->input_fence_syncobj_handles,
883 				       args->num_syncobj_handles);
884 	if (r)
885 		goto error_put_gobj;
886 
887 	drm_exec_init(&exec, DRM_EXEC_INTERRUPTIBLE_WAIT |
888 		      DRM_EXEC_IGNORE_DUPLICATES, 0);
889 	drm_exec_until_all_locked(&exec) {
890 		if (gobj) {
891 			r = drm_exec_lock_obj(&exec, gobj);
892 			drm_exec_retry_on_contention(&exec);
893 			if (unlikely(r))
894 				goto error;
895 		}
896 
897 		r = amdgpu_vm_lock_pd(&fpriv->vm, &exec, 2);
898 		drm_exec_retry_on_contention(&exec);
899 		if (unlikely(r))
900 			goto error;
901 	}
902 
903 	if (abo) {
904 		bo_va = amdgpu_vm_bo_find(&fpriv->vm, abo);
905 		if (!bo_va) {
906 			r = -ENOENT;
907 			goto error;
908 		}
909 	} else if (args->operation != AMDGPU_VA_OP_CLEAR) {
910 		bo_va = fpriv->prt_va;
911 	} else {
912 		bo_va = NULL;
913 	}
914 
915 	r = amdgpu_gem_update_timeline_node(filp,
916 					    args->vm_timeline_syncobj_out,
917 					    args->vm_timeline_point,
918 					    &timeline_syncobj,
919 					    &timeline_chain);
920 	if (r)
921 		goto error;
922 
923 	switch (args->operation) {
924 	case AMDGPU_VA_OP_MAP:
925 		r = amdgpu_vm_bo_map(adev, bo_va, args->va_address,
926 				     args->offset_in_bo, args->map_size,
927 				     args->flags);
928 		break;
929 	case AMDGPU_VA_OP_UNMAP:
930 		r = amdgpu_vm_bo_unmap(adev, bo_va, args->va_address);
931 		break;
932 
933 	case AMDGPU_VA_OP_CLEAR:
934 		r = amdgpu_vm_bo_clear_mappings(adev, &fpriv->vm,
935 						args->va_address,
936 						args->map_size);
937 		break;
938 	case AMDGPU_VA_OP_REPLACE:
939 		r = amdgpu_vm_bo_replace_map(adev, bo_va, args->va_address,
940 					     args->offset_in_bo, args->map_size,
941 					     args->flags);
942 		break;
943 	default:
944 		break;
945 	}
946 	if (!r && !(args->flags & AMDGPU_VM_DELAY_UPDATE) && !adev->debug_vm) {
947 		fence = amdgpu_gem_va_update_vm(adev, &fpriv->vm, bo_va,
948 						args->operation);
949 
950 		if (timeline_syncobj)
951 			amdgpu_gem_update_bo_mapping(filp, bo_va,
952 					     args->operation,
953 					     args->vm_timeline_point,
954 					     fence, timeline_syncobj,
955 					     timeline_chain);
956 		else
957 			dma_fence_put(fence);
958 
959 	}
960 
961 error:
962 	drm_exec_fini(&exec);
963 error_put_gobj:
964 	drm_gem_object_put(gobj);
965 	return r;
966 }
967 
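/**
 * amdgpu_gem_op_ioctl - query or change properties of a GEM object
 *
 * @dev: drm device pointer
 * @data: struct drm_amdgpu_gem_op in/out arguments
 * @filp: drm file pointer
 *
 * Supports querying the creation parameters (GET_GEM_CREATE_INFO), changing
 * the preferred placement domains (SET_PLACEMENT) and retrieving the VA
 * mappings of the BO in this VM (GET_MAPPING_INFO).
 */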
968 int amdgpu_gem_op_ioctl(struct drm_device *dev, void *data,
969 			struct drm_file *filp)
970 {
971 	struct drm_amdgpu_gem_op *args = data;
972 	struct drm_gem_object *gobj;
973 	struct amdgpu_vm_bo_base *base;
974 	struct amdgpu_bo *robj;
975 	struct drm_exec exec;
976 	struct amdgpu_fpriv *fpriv = filp->driver_priv;
977 	int r;
978 
979 	if (args->padding)
980 		return -EINVAL;
981 
982 	gobj = drm_gem_object_lookup(filp, args->handle);
983 	if (!gobj)
984 		return -ENOENT;
985 
986 	robj = gem_to_amdgpu_bo(gobj);
987 
988 	drm_exec_init(&exec, DRM_EXEC_INTERRUPTIBLE_WAIT |
989 			  DRM_EXEC_IGNORE_DUPLICATES, 0);
990 	drm_exec_until_all_locked(&exec) {
991 		r = drm_exec_lock_obj(&exec, gobj);
992 		drm_exec_retry_on_contention(&exec);
993 		if (r)
994 			goto out_exec;
995 
996 		if (args->op == AMDGPU_GEM_OP_GET_MAPPING_INFO) {
997 			r = amdgpu_vm_lock_pd(&fpriv->vm, &exec, 0);
998 			drm_exec_retry_on_contention(&exec);
999 			if (r)
1000 				goto out_exec;
1001 		}
1002 	}
1003 
1004 	switch (args->op) {
1005 	case AMDGPU_GEM_OP_GET_GEM_CREATE_INFO: {
1006 		struct drm_amdgpu_gem_create_in info;
1007 		void __user *out = u64_to_user_ptr(args->value);
1008 
1009 		info.bo_size = robj->tbo.base.size;
1010 		info.alignment = robj->tbo.page_alignment << PAGE_SHIFT;
1011 		info.domains = robj->preferred_domains;
1012 		info.domain_flags = robj->flags;
1013 		drm_exec_fini(&exec);
1014 		if (copy_to_user(out, &info, sizeof(info)))
1015 			r = -EFAULT;
1016 		break;
1017 	}
1018 	case AMDGPU_GEM_OP_SET_PLACEMENT:
1019 		if (drm_gem_is_imported(&robj->tbo.base) &&
1020 		    args->value & AMDGPU_GEM_DOMAIN_VRAM) {
1021 			r = -EINVAL;
1022 			goto out_exec;
1023 		}
1024 		if (amdgpu_ttm_tt_get_usermm(robj->tbo.ttm)) {
1025 			r = -EPERM;
1026 			goto out_exec;
1027 		}
1028 		for (base = robj->vm_bo; base; base = base->next)
1029 			if (amdgpu_xgmi_same_hive(amdgpu_ttm_adev(robj->tbo.bdev),
1030 				amdgpu_ttm_adev(base->vm->root.bo->tbo.bdev))) {
1031 				r = -EINVAL;
1032 				goto out_exec;
1033 			}
1034 
1035 
1036 		robj->preferred_domains = args->value & (AMDGPU_GEM_DOMAIN_VRAM |
1037 							AMDGPU_GEM_DOMAIN_GTT |
1038 							AMDGPU_GEM_DOMAIN_CPU);
1039 		robj->allowed_domains = robj->preferred_domains;
1040 		if (robj->allowed_domains == AMDGPU_GEM_DOMAIN_VRAM)
1041 			robj->allowed_domains |= AMDGPU_GEM_DOMAIN_GTT;
1042 
1043 		if (robj->flags & AMDGPU_GEM_CREATE_VM_ALWAYS_VALID)
1044 			amdgpu_vm_bo_invalidate(robj, true);
1045 		drm_exec_fini(&exec);
1046 		break;
1047 	case AMDGPU_GEM_OP_GET_MAPPING_INFO: {
1048 		struct amdgpu_bo_va *bo_va = amdgpu_vm_bo_find(&fpriv->vm, robj);
1049 		struct drm_amdgpu_gem_vm_entry *vm_entries;
1050 		struct amdgpu_bo_va_mapping *mapping;
1051 		int num_mappings = 0;
1052 		/*
1053 		 * On input, num_entries is the size of the user-allocated array of
1054 		 * drm_amdgpu_gem_vm_entry stored at args->value. On output it is
1055 		 * the number of mappings the BO has.
1056 		 * If that number is larger than the size of the array, the ioctl must
1057 		 * be retried.
1058 		 */
1059 		vm_entries = kvcalloc(args->num_entries, sizeof(*vm_entries), GFP_KERNEL);
1060 		if (!vm_entries) {
1061 			r = -ENOMEM;
			goto out_exec;
		}
1062 
1063 		amdgpu_vm_bo_va_for_each_valid_mapping(bo_va, mapping) {
1064 			if (num_mappings < args->num_entries) {
1065 				vm_entries[num_mappings].addr = mapping->start * AMDGPU_GPU_PAGE_SIZE;
1066 				vm_entries[num_mappings].size = (mapping->last - mapping->start + 1) * AMDGPU_GPU_PAGE_SIZE;
1067 				vm_entries[num_mappings].offset = mapping->offset;
1068 				vm_entries[num_mappings].flags = mapping->flags;
1069 			}
1070 			num_mappings += 1;
1071 		}
1072 
1073 		amdgpu_vm_bo_va_for_each_invalid_mapping(bo_va, mapping) {
1074 			if (num_mappings < args->num_entries) {
1075 				vm_entries[num_mappings].addr = mapping->start * AMDGPU_GPU_PAGE_SIZE;
1076 				vm_entries[num_mappings].size = (mapping->last - mapping->start + 1) * AMDGPU_GPU_PAGE_SIZE;
1077 				vm_entries[num_mappings].offset = mapping->offset;
1078 				vm_entries[num_mappings].flags = mapping->flags;
1079 			}
1080 			num_mappings += 1;
1081 		}
1082 
1083 		drm_exec_fini(&exec);
1084 
1085 		if (num_mappings > 0 && num_mappings <= args->num_entries)
1086 			if (copy_to_user(u64_to_user_ptr(args->value), vm_entries, num_mappings * sizeof(*vm_entries)))
1087 				r = -EFAULT;
1088 
1089 		args->num_entries = num_mappings;
1090 
1091 		kvfree(vm_entries);
1092 		break;
1093 	}
1094 	default:
1095 		drm_exec_fini(&exec);
1096 		r = -EINVAL;
1097 	}
1098 
1099 	drm_gem_object_put(gobj);
1100 	return r;
1101 out_exec:
1102 	drm_exec_fini(&exec);
1103 	drm_gem_object_put(gobj);
1104 	return r;
1105 }
1106 
1107 /**
1108  * amdgpu_gem_list_handles_ioctl - get information about a process' buffer objects
1109  *
1110  * @dev: drm device pointer
1111  * @data: drm_amdgpu_gem_list_handles
1112  * @filp: drm file pointer
1113  *
1114  * On input, num_entries is the size of the entries array; on output it is
1115  * the number of BOs owned by the process.
1116  * If that number is larger than the size of the array, the ioctl must
1117  * be retried.
1118  *
1119  * Returns:
1120  * 0 for success, -errno for errors.
1121  */
1122 int amdgpu_gem_list_handles_ioctl(struct drm_device *dev, void *data,
1123 				  struct drm_file *filp)
1124 {
1125 	struct drm_amdgpu_gem_list_handles *args = data;
1126 	struct drm_amdgpu_gem_list_handles_entry *bo_entries;
1127 	struct drm_gem_object *gobj;
1128 	int id, ret = 0;
1129 	int bo_index = 0;
1130 	int num_bos = 0;
1131 
1132 	spin_lock(&filp->table_lock);
1133 	idr_for_each_entry(&filp->object_idr, gobj, id)
1134 		num_bos += 1;
1135 	spin_unlock(&filp->table_lock);
1136 
1137 	if (args->num_entries < num_bos) {
1138 		args->num_entries = num_bos;
1139 		return 0;
1140 	}
1141 
1142 	if (num_bos == 0) {
1143 		args->num_entries = 0;
1144 		return 0;
1145 	}
1146 
1147 	bo_entries = kvcalloc(num_bos, sizeof(*bo_entries), GFP_KERNEL);
1148 	if (!bo_entries)
1149 		return -ENOMEM;
1150 
1151 	spin_lock(&filp->table_lock);
1152 	idr_for_each_entry(&filp->object_idr, gobj, id) {
1153 		struct amdgpu_bo *bo = gem_to_amdgpu_bo(gobj);
1154 		struct drm_amdgpu_gem_list_handles_entry *bo_entry;
1155 
1156 		if (bo_index >= num_bos) {
1157 			ret = -EAGAIN;
1158 			break;
1159 		}
1160 
1161 		bo_entry = &bo_entries[bo_index];
1162 
1163 		bo_entry->size = amdgpu_bo_size(bo);
1164 		bo_entry->alloc_flags = bo->flags & AMDGPU_GEM_CREATE_SETTABLE_MASK;
1165 		bo_entry->preferred_domains = bo->preferred_domains;
1166 		bo_entry->gem_handle = id;
1167 		bo_entry->alignment = bo->tbo.page_alignment;
1168 
1169 		if (bo->tbo.base.import_attach)
1170 			bo_entry->flags |= AMDGPU_GEM_LIST_HANDLES_FLAG_IS_IMPORT;
1171 
1172 		bo_index += 1;
1173 	}
1174 	spin_unlock(&filp->table_lock);
1175 
1176 	args->num_entries = bo_index;
1177 
1178 	if (!ret)
1179 		if (copy_to_user(u64_to_user_ptr(args->entries), bo_entries, num_bos * sizeof(*bo_entries)))
1180 			ret = -EFAULT;
1181 
1182 	kvfree(bo_entries);
1183 
1184 	return ret;
1185 }
1186 
1187 static int amdgpu_gem_align_pitch(struct amdgpu_device *adev,
1188 				  int width,
1189 				  int cpp,
1190 				  bool tiled)
1191 {
1192 	int aligned = width;
1193 	int pitch_mask = 0;
1194 
1195 	switch (cpp) {
1196 	case 1:
1197 		pitch_mask = 255;
1198 		break;
1199 	case 2:
1200 		pitch_mask = 127;
1201 		break;
1202 	case 3:
1203 	case 4:
1204 		pitch_mask = 63;
1205 		break;
1206 	}
1207 
1208 	aligned += pitch_mask;
1209 	aligned &= ~pitch_mask;
1210 	return aligned * cpp;
1211 }
1212 
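/**
 * amdgpu_mode_dumb_create - create a dumb buffer for scanout
 *
 * @file_priv: drm file pointer
 * @dev: drm device pointer
 * @args: dumb buffer parameters, pitch/size/handle are filled in
 *
 * Allocates a CPU-accessible, contiguous buffer in a domain supported by the
 * display hardware, with the pitch aligned by amdgpu_gem_align_pitch(), and
 * returns a GEM handle for it.
 */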
1213 int amdgpu_mode_dumb_create(struct drm_file *file_priv,
1214 			    struct drm_device *dev,
1215 			    struct drm_mode_create_dumb *args)
1216 {
1217 	struct amdgpu_device *adev = drm_to_adev(dev);
1218 	struct amdgpu_fpriv *fpriv = file_priv->driver_priv;
1219 	struct drm_gem_object *gobj;
1220 	uint32_t handle;
1221 	u64 flags = AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED |
1222 		    AMDGPU_GEM_CREATE_CPU_GTT_USWC |
1223 		    AMDGPU_GEM_CREATE_VRAM_CONTIGUOUS;
1224 	u32 domain;
1225 	int r;
1226 
1227 	/*
1228 	 * The buffer returned from this function should be cleared, but
1229 	 * it can only be done if the ring is enabled or we'll fail to
1230 	 * create the buffer.
1231 	 */
1232 	if (adev->mman.buffer_funcs_enabled)
1233 		flags |= AMDGPU_GEM_CREATE_VRAM_CLEARED;
1234 
1235 	args->pitch = amdgpu_gem_align_pitch(adev, args->width,
1236 					     DIV_ROUND_UP(args->bpp, 8), 0);
1237 	args->size = (u64)args->pitch * args->height;
1238 	args->size = ALIGN(args->size, PAGE_SIZE);
1239 	domain = amdgpu_bo_get_preferred_domain(adev,
1240 				amdgpu_display_supported_domains(adev, flags));
1241 	r = amdgpu_gem_object_create(adev, args->size, 0, domain, flags,
1242 				     ttm_bo_type_device, NULL, &gobj, fpriv->xcp_id + 1);
1243 	if (r)
1244 		return -ENOMEM;
1245 
1246 	r = drm_gem_handle_create(file_priv, gobj, &handle);
1247 	/* drop reference from allocate - handle holds it now */
1248 	drm_gem_object_put(gobj);
1249 	if (r)
1250 		return r;
1251 
1252 	args->handle = handle;
1253 	return 0;
1254 }
1255 
1256 #if defined(CONFIG_DEBUG_FS)
1257 static int amdgpu_debugfs_gem_info_show(struct seq_file *m, void *unused)
1258 {
1259 	struct amdgpu_device *adev = m->private;
1260 	struct drm_device *dev = adev_to_drm(adev);
1261 	struct drm_file *file;
1262 	int r;
1263 
1264 	r = mutex_lock_interruptible(&dev->filelist_mutex);
1265 	if (r)
1266 		return r;
1267 
1268 	list_for_each_entry(file, &dev->filelist, lhead) {
1269 		struct task_struct *task;
1270 		struct drm_gem_object *gobj;
1271 		struct pid *pid;
1272 		int id;
1273 
1274 		/*
1275 		 * Although we have a valid reference on file->pid, that does
1276 		 * not guarantee that the task_struct who called get_pid() is
1277 		 * still alive (e.g. get_pid(current) => fork() => exit()).
1278 		 * Therefore, we need to protect this ->comm access using RCU.
1279 		 */
1280 		rcu_read_lock();
1281 		pid = rcu_dereference(file->pid);
1282 		task = pid_task(pid, PIDTYPE_TGID);
1283 		seq_printf(m, "pid %8d command %s:\n", pid_nr(pid),
1284 			   task ? task->comm : "<unknown>");
1285 		rcu_read_unlock();
1286 
1287 		spin_lock(&file->table_lock);
1288 		idr_for_each_entry(&file->object_idr, gobj, id) {
1289 			struct amdgpu_bo *bo = gem_to_amdgpu_bo(gobj);
1290 
1291 			amdgpu_bo_print_info(id, bo, m);
1292 		}
1293 		spin_unlock(&file->table_lock);
1294 	}
1295 
1296 	mutex_unlock(&dev->filelist_mutex);
1297 	return 0;
1298 }
1299 
1300 DEFINE_SHOW_ATTRIBUTE(amdgpu_debugfs_gem_info);
1301 
1302 #endif
1303 
1304 void amdgpu_debugfs_gem_init(struct amdgpu_device *adev)
1305 {
1306 #if defined(CONFIG_DEBUG_FS)
1307 	struct drm_minor *minor = adev_to_drm(adev)->primary;
1308 	struct dentry *root = minor->debugfs_root;
1309 
1310 	debugfs_create_file("amdgpu_gem_info", 0444, root, adev,
1311 			    &amdgpu_debugfs_gem_info_fops);
1312 #endif
1313 }
1314