// SPDX-License-Identifier: GPL-2.0+
/* Copyright (C) 2015-2018 Broadcom */

/**
 * DOC: V3D GEM BO management support
 *
 * Compared to VC4 (V3D 2.x), V3D 3.3 introduces an MMU between the
 * GPU and the bus, allowing us to use shmem objects for our storage
 * instead of CMA.
 *
 * Physically contiguous objects may still be imported to V3D, but the
 * driver doesn't allocate physically contiguous objects on its own.
 * Display engines requiring physically contiguous allocations should
 * look into Mesa's "renderonly" support (as used by the Mesa pl111
 * driver) for an example of how to integrate with V3D.
 */

#include <linux/dma-buf.h>
#include <linux/pfn_t.h>
#include <linux/vmalloc.h>

#include "v3d_drv.h"
#include "uapi/drm/v3d_drm.h"

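/* Reports whether the BO's backing pages are currently resident, for
 * the DRM core's fdinfo memory-usage accounting.
 */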
static enum drm_gem_object_status v3d_gem_status(struct drm_gem_object *obj)
{
	struct v3d_bo *bo = to_v3d_bo(obj);
	enum drm_gem_object_status res = 0;

	if (bo->base.pages)
		res |= DRM_GEM_OBJECT_RESIDENT;

	return res;
}

/* Called by the DRM core on the last userspace/kernel unreference of the
 * BO.
 */
void v3d_free_object(struct drm_gem_object *obj)
{
	struct v3d_dev *v3d = to_v3d_dev(obj->dev);
	struct v3d_bo *bo = to_v3d_bo(obj);

	if (bo->vaddr)
		v3d_put_bo_vaddr(bo);

	v3d_mmu_remove_ptes(bo);

	mutex_lock(&v3d->bo_lock);
	v3d->bo_stats.num_allocated--;
	v3d->bo_stats.pages_allocated -= obj->size >> V3D_MMU_PAGE_SHIFT;
	mutex_unlock(&v3d->bo_lock);

	spin_lock(&v3d->mm_lock);
	drm_mm_remove_node(&bo->node);
	spin_unlock(&v3d->mm_lock);

	/* GPU execution may have dirtied any pages in the BO. */
	bo->base.pages_mark_dirty_on_put = true;

	drm_gem_shmem_free(&bo->base);
}

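/* BO operations, mostly delegated to the shmem GEM helpers. */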
static const struct drm_gem_object_funcs v3d_gem_funcs = {
	.free = v3d_free_object,
	.print_info = drm_gem_shmem_object_print_info,
	.pin = drm_gem_shmem_object_pin,
	.unpin = drm_gem_shmem_object_unpin,
	.get_sg_table = drm_gem_shmem_object_get_sg_table,
	.vmap = drm_gem_shmem_object_vmap,
	.vunmap = drm_gem_shmem_object_vunmap,
	.mmap = drm_gem_shmem_object_mmap,
	.status = v3d_gem_status,
	.vm_ops = &drm_gem_shmem_vm_ops,
};

/* gem_create_object function for allocating a BO struct and doing
 * early setup.
 */
struct drm_gem_object *v3d_create_object(struct drm_device *dev, size_t size)
{
	struct v3d_bo *bo;
	struct drm_gem_object *obj;

	if (size == 0)
		return ERR_PTR(-EINVAL);

	bo = kzalloc(sizeof(*bo), GFP_KERNEL);
	if (!bo)
		return ERR_PTR(-ENOMEM);
	obj = &bo->base.base;

	obj->funcs = &v3d_gem_funcs;
	bo->base.map_wc = true;
	INIT_LIST_HEAD(&bo->unref_head);

	return &bo->base.base;
}

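/* Completes BO setup shared by native allocation and dma-buf import:
 * pins the backing pages, reserves a node in the GPU's virtual address
 * space for the BO's lifetime, and inserts the PTEs.
 */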
static int
v3d_bo_create_finish(struct drm_gem_object *obj)
{
	struct v3d_dev *v3d = to_v3d_dev(obj->dev);
	struct v3d_bo *bo = to_v3d_bo(obj);
	struct sg_table *sgt;
	u64 align;
	int ret;

	/* So far we pin the BO in the MMU for its lifetime, so use
	 * shmem's helper for getting a lifetime sgt.
	 */
	sgt = drm_gem_shmem_get_pages_sgt(&bo->base);
	if (IS_ERR(sgt))
		return PTR_ERR(sgt);

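	/* When the BO is backed by the huge-page gemfs mount, align its
	 * GPU VA so the MMU can use big (64KB) and super (1MB) pages.
	 */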
	if (!v3d->gemfs)
		align = SZ_4K;
	else if (obj->size >= SZ_1M)
		align = SZ_1M;
	else if (obj->size >= SZ_64K)
		align = SZ_64K;
	else
		align = SZ_4K;

	spin_lock(&v3d->mm_lock);
	/* Allocate the object's space in the GPU's page tables.
	 * Inserting PTEs will happen later, but the offset is for the
	 * lifetime of the BO.
	 */
	ret = drm_mm_insert_node_generic(&v3d->mm, &bo->node,
					 obj->size >> V3D_MMU_PAGE_SHIFT,
					 align >> V3D_MMU_PAGE_SHIFT, 0, 0);
	spin_unlock(&v3d->mm_lock);
	if (ret)
		return ret;

	/* Track stats exposed in debugfs (dri/<n>/bo_stats). */
	mutex_lock(&v3d->bo_lock);
	v3d->bo_stats.num_allocated++;
	v3d->bo_stats.pages_allocated += obj->size >> V3D_MMU_PAGE_SHIFT;
	mutex_unlock(&v3d->bo_lock);

	v3d_mmu_insert_ptes(bo);

	return 0;
}

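/* Allocates a shmem-backed BO (from the huge-page mount when one is
 * available) and finishes its GPU-side setup.
 */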
struct v3d_bo *v3d_bo_create(struct drm_device *dev, struct drm_file *file_priv,
			     size_t unaligned_size)
{
	struct drm_gem_shmem_object *shmem_obj;
	struct v3d_dev *v3d = to_v3d_dev(dev);
	struct v3d_bo *bo;
	int ret;

	shmem_obj = drm_gem_shmem_create_with_mnt(dev, unaligned_size,
						  v3d->gemfs);
	if (IS_ERR(shmem_obj))
		return ERR_CAST(shmem_obj);
	bo = to_v3d_bo(&shmem_obj->base);
	bo->vaddr = NULL;

	ret = v3d_bo_create_finish(&shmem_obj->base);
	if (ret)
		goto free_obj;

	return bo;

free_obj:
	drm_gem_shmem_free(shmem_obj);
	return ERR_PTR(ret);
}

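/* dma-buf import: wraps the imported sg_table in a shmem object, then
 * maps it into the GPU's address space like a natively allocated BO.
 */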
struct drm_gem_object *
v3d_prime_import_sg_table(struct drm_device *dev,
			  struct dma_buf_attachment *attach,
			  struct sg_table *sgt)
{
	struct drm_gem_object *obj;
	int ret;

	obj = drm_gem_shmem_prime_import_sg_table(dev, attach, sgt);
	if (IS_ERR(obj))
		return obj;

	ret = v3d_bo_create_finish(obj);
	if (ret) {
		drm_gem_shmem_free(&to_v3d_bo(obj)->base);
		return ERR_PTR(ret);
	}

	return obj;
}

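/* Maps the BO's pages into the kernel's address space, write-combined.
 * Note that vmap() can fail, in which case bo->vaddr is left NULL.
 */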
void v3d_get_bo_vaddr(struct v3d_bo *bo)
{
	struct drm_gem_shmem_object *obj = &bo->base;

	bo->vaddr = vmap(obj->pages, obj->base.size >> PAGE_SHIFT, VM_MAP,
			 pgprot_writecombine(PAGE_KERNEL));
}

void v3d_put_bo_vaddr(struct v3d_bo *bo)
{
	vunmap(bo->vaddr);
	bo->vaddr = NULL;
}

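/* Allocates a BO for userspace and returns a GEM handle along with the
 * BO's fixed offset in the GPU's virtual address space.
 */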
int v3d_create_bo_ioctl(struct drm_device *dev, void *data,
			struct drm_file *file_priv)
{
	struct drm_v3d_create_bo *args = data;
	struct v3d_bo *bo = NULL;
	int ret;

	if (args->flags != 0) {
		DRM_INFO("unknown create_bo flags: %d\n", args->flags);
		return -EINVAL;
	}

	bo = v3d_bo_create(dev, file_priv, PAGE_ALIGN(args->size));
	if (IS_ERR(bo))
		return PTR_ERR(bo);

	args->offset = bo->node.start << V3D_MMU_PAGE_SHIFT;

	ret = drm_gem_handle_create(file_priv, &bo->base.base, &args->handle);
	drm_gem_object_put(&bo->base.base);

	return ret;
}

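/* Returns the fake offset userspace passes to mmap() on the DRM fd in
 * order to map the BO into its address space.
 */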
int v3d_mmap_bo_ioctl(struct drm_device *dev, void *data,
		      struct drm_file *file_priv)
{
	struct drm_v3d_mmap_bo *args = data;
	struct drm_gem_object *gem_obj;

	if (args->flags != 0) {
		DRM_INFO("unknown mmap_bo flags: %d\n", args->flags);
		return -EINVAL;
	}

	gem_obj = drm_gem_object_lookup(file_priv, args->handle);
	if (!gem_obj) {
		DRM_DEBUG("Failed to look up GEM BO %d\n", args->handle);
		return -ENOENT;
	}

	args->offset = drm_vma_node_offset_addr(&gem_obj->vma_node);
	drm_gem_object_put(gem_obj);

	return 0;
}

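/* Reports the BO's offset in the GPU's virtual address space. */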
int v3d_get_bo_offset_ioctl(struct drm_device *dev, void *data,
			    struct drm_file *file_priv)
{
	struct drm_v3d_get_bo_offset *args = data;
	struct drm_gem_object *gem_obj;
	struct v3d_bo *bo;

	gem_obj = drm_gem_object_lookup(file_priv, args->handle);
	if (!gem_obj) {
		DRM_DEBUG("Failed to look up GEM BO %d\n", args->handle);
		return -ENOENT;
	}
	bo = to_v3d_bo(gem_obj);

	args->offset = bo->node.start << V3D_MMU_PAGE_SHIFT;

	drm_gem_object_put(gem_obj);
	return 0;
}

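/* Blocks until all GPU work using the BO has completed or the caller's
 * timeout expires, whichever comes first.
 */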
int
v3d_wait_bo_ioctl(struct drm_device *dev, void *data,
		  struct drm_file *file_priv)
{
	int ret;
	struct drm_v3d_wait_bo *args = data;
	ktime_t start = ktime_get();
	u64 delta_ns;
	unsigned long timeout_jiffies =
		nsecs_to_jiffies_timeout(args->timeout_ns);

	if (args->pad != 0)
		return -EINVAL;

	ret = drm_gem_dma_resv_wait(file_priv, args->handle,
				    true, timeout_jiffies);

	/* Decrement the user's timeout, in case we got interrupted
	 * such that the ioctl will be restarted.
	 */
	delta_ns = ktime_to_ns(ktime_sub(ktime_get(), start));
	if (delta_ns < args->timeout_ns)
		args->timeout_ns -= delta_ns;
	else
		args->timeout_ns = 0;

	/* Asked to wait beyond the jiffy/scheduler precision? */
	if (ret == -ETIME && args->timeout_ns)
		ret = -EAGAIN;

	return ret;
}