// SPDX-License-Identifier: MIT
/*
 * Copyright 2024 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */
#include <linux/sched.h>
#include <drm/drm_exec.h>
#include "amdgpu.h"

#define work_to_evf_mgr(w, name) container_of(w, struct amdgpu_eviction_fence_mgr, name)
#define evf_mgr_to_fpriv(e) container_of(e, struct amdgpu_fpriv, evf_mgr)

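/* dma_fence_ops->get_driver_name() callback */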
static const char *
amdgpu_eviction_fence_get_driver_name(struct dma_fence *fence)
{
	return "amdgpu_eviction_fence";
}

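/*
 * dma_fence_ops->get_timeline_name() callback; the timeline name is the
 * comm of the task that created the fence, captured in
 * amdgpu_eviction_fence_create().
 */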
static const char *
amdgpu_eviction_fence_get_timeline_name(struct dma_fence *f)
{
	struct amdgpu_eviction_fence *ef;

	ef = container_of(f, struct amdgpu_eviction_fence, base);
	return ef->timeline_name;
}

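/**
 * amdgpu_eviction_fence_replace_fence - replace a signaled eviction fence
 * @evf_mgr: eviction fence manager for this fpriv
 * @exec: drm_exec context in which the caller has locked the affected BOs
 *
 * A signaled fence cannot be reused, so once the current eviction fence
 * has signaled, create a new one, publish it in @evf_mgr under the fence
 * lock, attach it to every BO locked in @exec and finally drop the old
 * fence. If the current fence has not signaled yet, nothing needs to be
 * done.
 *
 * Return: 0 on success, negative error code on failure.
 */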
int
amdgpu_eviction_fence_replace_fence(struct amdgpu_eviction_fence_mgr *evf_mgr,
				    struct drm_exec *exec)
{
	struct amdgpu_eviction_fence *old_ef, *new_ef;
	struct drm_gem_object *obj;
	unsigned long index;
	int ret;

	if (evf_mgr->ev_fence &&
	    !dma_fence_is_signaled(&evf_mgr->ev_fence->base))
		return 0;
	/*
	 * Steps to replace eviction fence:
	 * * lock all objects in exec (caller)
	 * * create a new eviction fence
	 * * update new eviction fence in evf_mgr
	 * * attach the new eviction fence to BOs
	 * * release the old fence
	 * * unlock the objects (caller)
	 */
	new_ef = amdgpu_eviction_fence_create(evf_mgr);
	if (!new_ef) {
		DRM_ERROR("Failed to create new eviction fence\n");
		return -ENOMEM;
	}

	/* Update the eviction fence now */
	spin_lock(&evf_mgr->ev_fence_lock);
	old_ef = evf_mgr->ev_fence;
	evf_mgr->ev_fence = new_ef;
	spin_unlock(&evf_mgr->ev_fence_lock);

	/* Attach the new fence */
	drm_exec_for_each_locked_object(exec, index, obj) {
		struct amdgpu_bo *bo = gem_to_amdgpu_bo(obj);

		if (!bo)
			continue;
		ret = amdgpu_eviction_fence_attach(evf_mgr, bo);
		if (ret) {
			DRM_ERROR("Failed to attach new eviction fence\n");
			goto free_err;
		}
	}

	/* Free old fence */
	if (old_ef)
		dma_fence_put(&old_ef->base);
	return 0;

free_err:
	/*
	 * The fence has been initialized and may already have been attached
	 * to some reservation objects above, so drop the initial reference
	 * instead of freeing it directly.
	 */
	dma_fence_put(&new_ef->base);
	return ret;
}

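/*
 * Delayed work, kicked from amdgpu_eviction_fence_enable_signaling():
 * takes a reference on the current eviction fence under the fence lock,
 * then evicts this fpriv's user queues with the userq mutex held.
 */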
static void
amdgpu_eviction_fence_suspend_worker(struct work_struct *work)
{
	struct amdgpu_eviction_fence_mgr *evf_mgr = work_to_evf_mgr(work, suspend_work.work);
	struct amdgpu_fpriv *fpriv = evf_mgr_to_fpriv(evf_mgr);
	struct amdgpu_userq_mgr *uq_mgr = &fpriv->userq_mgr;
	struct amdgpu_eviction_fence *ev_fence;

	mutex_lock(&uq_mgr->userq_mutex);
	spin_lock(&evf_mgr->ev_fence_lock);
	ev_fence = evf_mgr->ev_fence;
	if (ev_fence)
		dma_fence_get(&ev_fence->base);
	else
		goto unlock;
	spin_unlock(&evf_mgr->ev_fence_lock);

	amdgpu_userq_evict(uq_mgr, ev_fence);

	mutex_unlock(&uq_mgr->userq_mutex);
	dma_fence_put(&ev_fence->base);
	return;

unlock:
	spin_unlock(&evf_mgr->ev_fence_lock);
	mutex_unlock(&uq_mgr->userq_mutex);
}

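/*
 * dma_fence_ops->enable_signaling() callback: a waiter showed up on the
 * eviction fence (typically because a BO carrying it is about to be
 * evicted), so schedule the suspend worker, which suspends the user
 * queues and is expected to signal the fence once that is done.
 */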
static bool amdgpu_eviction_fence_enable_signaling(struct dma_fence *f)
{
	struct amdgpu_eviction_fence_mgr *evf_mgr;
	struct amdgpu_eviction_fence *ev_fence;

	if (!f)
		return true;

	ev_fence = to_ev_fence(f);
	evf_mgr = ev_fence->evf_mgr;

	schedule_delayed_work(&evf_mgr->suspend_work, 0);
	return true;
}

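/* Fence ops shared by all eviction fences */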
static const struct dma_fence_ops amdgpu_eviction_fence_ops = {
	.use_64bit_seqno = true,
	.get_driver_name = amdgpu_eviction_fence_get_driver_name,
	.get_timeline_name = amdgpu_eviction_fence_get_timeline_name,
	.enable_signaling = amdgpu_eviction_fence_enable_signaling,
};

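/*
 * Signal the eviction fence under the fence lock, so that signaling
 * cannot race with publishing or reading evf_mgr->ev_fence.
 */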
void amdgpu_eviction_fence_signal(struct amdgpu_eviction_fence_mgr *evf_mgr,
				  struct amdgpu_eviction_fence *ev_fence)
{
	spin_lock(&evf_mgr->ev_fence_lock);
	dma_fence_signal(&ev_fence->base);
	spin_unlock(&evf_mgr->ev_fence_lock);
}

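/*
 * Allocate a new eviction fence on the manager's fence context, with the
 * next sequence number and the calling task's comm as timeline name.
 */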
struct amdgpu_eviction_fence *
amdgpu_eviction_fence_create(struct amdgpu_eviction_fence_mgr *evf_mgr)
{
	struct amdgpu_eviction_fence *ev_fence;

	ev_fence = kzalloc(sizeof(*ev_fence), GFP_KERNEL);
	if (!ev_fence)
		return NULL;

	ev_fence->evf_mgr = evf_mgr;
	get_task_comm(ev_fence->timeline_name, current);
	spin_lock_init(&ev_fence->lock);
	dma_fence_init(&ev_fence->base, &amdgpu_eviction_fence_ops,
		       &ev_fence->lock, evf_mgr->ev_fence_ctx,
		       atomic_inc_return(&evf_mgr->ev_fence_seq));
	return ev_fence;
}

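/*
 * Final teardown: flush any pending suspend work, then wait for the
 * current eviction fence (if any) to signal before dropping what is
 * expected to be its last reference.
 */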
void amdgpu_eviction_fence_destroy(struct amdgpu_eviction_fence_mgr *evf_mgr)
{
	struct amdgpu_eviction_fence *ev_fence;

	/* Wait for any pending work to execute */
	flush_delayed_work(&evf_mgr->suspend_work);

	spin_lock(&evf_mgr->ev_fence_lock);
	ev_fence = evf_mgr->ev_fence;
	spin_unlock(&evf_mgr->ev_fence_lock);

	if (!ev_fence)
		return;

	dma_fence_wait(&ev_fence->base, false);

	/* Last unref of ev_fence */
	dma_fence_put(&ev_fence->base);
}

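/*
 * Attach the current eviction fence, if any, to @bo as a
 * DMA_RESV_USAGE_BOOKKEEP fence, reserving a fence slot first. The
 * caller must hold the BO's reservation lock.
 */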
int amdgpu_eviction_fence_attach(struct amdgpu_eviction_fence_mgr *evf_mgr,
				 struct amdgpu_bo *bo)
{
	struct amdgpu_eviction_fence *ev_fence;
	struct dma_resv *resv = bo->tbo.base.resv;
	int ret;

	if (!resv)
		return 0;

	ret = dma_resv_reserve_fences(resv, 1);
	if (ret) {
		DRM_DEBUG_DRIVER("Failed to reserve fence space\n");
		return ret;
	}

	spin_lock(&evf_mgr->ev_fence_lock);
	ev_fence = evf_mgr->ev_fence;
	if (ev_fence)
		dma_resv_add_fence(resv, &ev_fence->base, DMA_RESV_USAGE_BOOKKEEP);
	spin_unlock(&evf_mgr->ev_fence_lock);

	return 0;
}

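/*
 * Detach the eviction fence from @bo by replacing all fences on the
 * manager's fence context with a signaled stub fence.
 */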
void amdgpu_eviction_fence_detach(struct amdgpu_eviction_fence_mgr *evf_mgr,
				  struct amdgpu_bo *bo)
{
	struct dma_fence *stub = dma_fence_get_stub();

	dma_resv_replace_fences(bo->tbo.base.resv, evf_mgr->ev_fence_ctx,
				stub, DMA_RESV_USAGE_BOOKKEEP);
	dma_fence_put(stub);
}

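/* One-time, per-open initialization of the eviction fence manager */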
int amdgpu_eviction_fence_init(struct amdgpu_eviction_fence_mgr *evf_mgr)
{
	/* This needs to be done one time per open */
	atomic_set(&evf_mgr->ev_fence_seq, 0);
	evf_mgr->ev_fence_ctx = dma_fence_context_alloc(1);
	spin_lock_init(&evf_mgr->ev_fence_lock);

	INIT_DELAYED_WORK(&evf_mgr->suspend_work, amdgpu_eviction_fence_suspend_worker);
	return 0;
}