xref: /linux/drivers/infiniband/core/rdma_core.c (revision b9b77222d4ff6b5bb8f5d87fca20de0910618bb9)
1 /*
2  * Copyright (c) 2016, Mellanox Technologies inc.  All rights reserved.
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * OpenIB.org BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and/or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  */
32 
33 #include <linux/file.h>
34 #include <linux/anon_inodes.h>
35 #include <rdma/ib_verbs.h>
36 #include <rdma/uverbs_types.h>
37 #include <linux/rcupdate.h>
38 #include <rdma/uverbs_ioctl.h>
39 #include <rdma/rdma_user_ioctl.h>
40 #include "uverbs.h"
41 #include "core_priv.h"
42 #include "rdma_core.h"
43 
44 int uverbs_ns_idx(u16 *id, unsigned int ns_count)
45 {
46 	int ret = (*id & UVERBS_ID_NS_MASK) >> UVERBS_ID_NS_SHIFT;
47 
48 	if (ret >= ns_count)
49 		return -EINVAL;
50 
51 	*id &= ~UVERBS_ID_NS_MASK;
52 	return ret;
53 }
54 
55 const struct uverbs_object_spec *uverbs_get_object(const struct ib_device *ibdev,
56 						   uint16_t object)
57 {
58 	const struct uverbs_root_spec *object_hash = ibdev->specs_root;
59 	const struct uverbs_object_spec_hash *objects;
60 	int ret = uverbs_ns_idx(&object, object_hash->num_buckets);
61 
62 	if (ret < 0)
63 		return NULL;
64 
65 	objects = object_hash->object_buckets[ret];
66 
67 	if (object >= objects->num_objects)
68 		return NULL;
69 
70 	return objects->objects[object];
71 }
72 
73 const struct uverbs_method_spec *uverbs_get_method(const struct uverbs_object_spec *object,
74 						   uint16_t method)
75 {
76 	const struct uverbs_method_spec_hash *methods;
77 	int ret = uverbs_ns_idx(&method, object->num_buckets);
78 
79 	if (ret < 0)
80 		return NULL;
81 
82 	methods = object->method_buckets[ret];
83 	if (method >= methods->num_methods)
84 		return NULL;
85 
86 	return methods->methods[method];
87 }
88 
89 void uverbs_uobject_get(struct ib_uobject *uobject)
90 {
91 	kref_get(&uobject->ref);
92 }
93 
94 static void uverbs_uobject_free(struct kref *ref)
95 {
96 	struct ib_uobject *uobj =
97 		container_of(ref, struct ib_uobject, ref);
98 
99 	if (uobj->type->type_class->needs_kfree_rcu)
100 		kfree_rcu(uobj, rcu);
101 	else
102 		kfree(uobj);
103 }
104 
105 void uverbs_uobject_put(struct ib_uobject *uobject)
106 {
107 	kref_put(&uobject->ref, uverbs_uobject_free);
108 }
109 
110 static int uverbs_try_lock_object(struct ib_uobject *uobj, bool exclusive)
111 {
112 	/*
113 	 * When a shared access is required, we use a positive counter. Each
114 	 * shared access request checks that the value != -1 and increment it.
115 	 * Exclusive access is required for operations like write or destroy.
116 	 * In exclusive access mode, we check that the counter is zero (nobody
117 	 * claimed this object) and we set it to -1. Releasing a shared access
118 	 * lock is done simply by decreasing the counter. As for exclusive
119 	 * access locks, since only a single one of them is is allowed
120 	 * concurrently, setting the counter to zero is enough for releasing
121 	 * this lock.
122 	 */
123 	if (!exclusive)
124 		return __atomic_add_unless(&uobj->usecnt, 1, -1) == -1 ?
125 			-EBUSY : 0;
126 
127 	/* lock is either WRITE or DESTROY - should be exclusive */
128 	return atomic_cmpxchg(&uobj->usecnt, 0, -1) == 0 ? 0 : -EBUSY;
129 }
130 
131 static struct ib_uobject *alloc_uobj(struct ib_ucontext *context,
132 				     const struct uverbs_obj_type *type)
133 {
134 	struct ib_uobject *uobj = kzalloc(type->obj_size, GFP_KERNEL);
135 
136 	if (!uobj)
137 		return ERR_PTR(-ENOMEM);
138 	/*
139 	 * user_handle should be filled by the handler,
140 	 * The object is added to the list in the commit stage.
141 	 */
142 	uobj->context = context;
143 	uobj->type = type;
144 	/*
145 	 * Allocated objects start out as write locked to deny any other
146 	 * syscalls from accessing them until they are committed. See
147 	 * rdma_alloc_commit_uobject
148 	 */
149 	atomic_set(&uobj->usecnt, -1);
150 	kref_init(&uobj->ref);
151 
152 	return uobj;
153 }
154 
155 static int idr_add_uobj(struct ib_uobject *uobj)
156 {
157 	int ret;
158 
159 	idr_preload(GFP_KERNEL);
160 	spin_lock(&uobj->context->ufile->idr_lock);
161 
162 	/*
163 	 * We start with allocating an idr pointing to NULL. This represents an
164 	 * object which isn't initialized yet. We'll replace it later on with
165 	 * the real object once we commit.
166 	 */
167 	ret = idr_alloc(&uobj->context->ufile->idr, NULL, 0,
168 			min_t(unsigned long, U32_MAX - 1, INT_MAX), GFP_NOWAIT);
169 	if (ret >= 0)
170 		uobj->id = ret;
171 
172 	spin_unlock(&uobj->context->ufile->idr_lock);
173 	idr_preload_end();
174 
175 	return ret < 0 ? ret : 0;
176 }
177 
178 /*
179  * It only removes it from the uobjects list, uverbs_uobject_put() is still
180  * required.
181  */
182 static void uverbs_idr_remove_uobj(struct ib_uobject *uobj)
183 {
184 	spin_lock(&uobj->context->ufile->idr_lock);
185 	idr_remove(&uobj->context->ufile->idr, uobj->id);
186 	spin_unlock(&uobj->context->ufile->idr_lock);
187 }
188 
189 /* Returns the ib_uobject or an error. The caller should check for IS_ERR. */
190 static struct ib_uobject *lookup_get_idr_uobject(const struct uverbs_obj_type *type,
191 						 struct ib_ucontext *ucontext,
192 						 int id, bool exclusive)
193 {
194 	struct ib_uobject *uobj;
195 
196 	rcu_read_lock();
197 	/* object won't be released as we're protected in rcu */
198 	uobj = idr_find(&ucontext->ufile->idr, id);
199 	if (!uobj) {
200 		uobj = ERR_PTR(-ENOENT);
201 		goto free;
202 	}
203 
204 	/*
205 	 * The idr_find is guaranteed to return a pointer to something that
206 	 * isn't freed yet, or NULL, as the free after idr_remove goes through
207 	 * kfree_rcu(). However the object may still have been released and
208 	 * kfree() could be called at any time.
209 	 */
210 	if (!kref_get_unless_zero(&uobj->ref))
211 		uobj = ERR_PTR(-ENOENT);
212 
213 free:
214 	rcu_read_unlock();
215 	return uobj;
216 }
217 
218 static struct ib_uobject *lookup_get_fd_uobject(const struct uverbs_obj_type *type,
219 						struct ib_ucontext *ucontext,
220 						int id, bool exclusive)
221 {
222 	struct file *f;
223 	struct ib_uobject *uobject;
224 	const struct uverbs_obj_fd_type *fd_type =
225 		container_of(type, struct uverbs_obj_fd_type, type);
226 
227 	if (exclusive)
228 		return ERR_PTR(-EOPNOTSUPP);
229 
230 	f = fget(id);
231 	if (!f)
232 		return ERR_PTR(-EBADF);
233 
234 	uobject = f->private_data;
235 	/*
236 	 * fget(id) ensures we are not currently running uverbs_close_fd,
237 	 * and the caller is expected to ensure that uverbs_close_fd is never
238 	 * done while a call top lookup is possible.
239 	 */
240 	if (f->f_op != fd_type->fops) {
241 		fput(f);
242 		return ERR_PTR(-EBADF);
243 	}
244 
245 	uverbs_uobject_get(uobject);
246 	return uobject;
247 }
248 
249 struct ib_uobject *rdma_lookup_get_uobject(const struct uverbs_obj_type *type,
250 					   struct ib_ucontext *ucontext,
251 					   int id, bool exclusive)
252 {
253 	struct ib_uobject *uobj;
254 	int ret;
255 
256 	uobj = type->type_class->lookup_get(type, ucontext, id, exclusive);
257 	if (IS_ERR(uobj))
258 		return uobj;
259 
260 	if (uobj->type != type) {
261 		ret = -EINVAL;
262 		goto free;
263 	}
264 
265 	ret = uverbs_try_lock_object(uobj, exclusive);
266 	if (ret) {
267 		WARN(ucontext->cleanup_reason,
268 		     "ib_uverbs: Trying to lookup_get while cleanup context\n");
269 		goto free;
270 	}
271 
272 	return uobj;
273 free:
274 	uobj->type->type_class->lookup_put(uobj, exclusive);
275 	uverbs_uobject_put(uobj);
276 	return ERR_PTR(ret);
277 }
278 
279 static struct ib_uobject *alloc_begin_idr_uobject(const struct uverbs_obj_type *type,
280 						  struct ib_ucontext *ucontext)
281 {
282 	int ret;
283 	struct ib_uobject *uobj;
284 
285 	uobj = alloc_uobj(ucontext, type);
286 	if (IS_ERR(uobj))
287 		return uobj;
288 
289 	ret = idr_add_uobj(uobj);
290 	if (ret)
291 		goto uobj_put;
292 
293 	ret = ib_rdmacg_try_charge(&uobj->cg_obj, ucontext->device,
294 				   RDMACG_RESOURCE_HCA_OBJECT);
295 	if (ret)
296 		goto idr_remove;
297 
298 	return uobj;
299 
300 idr_remove:
301 	uverbs_idr_remove_uobj(uobj);
302 uobj_put:
303 	uverbs_uobject_put(uobj);
304 	return ERR_PTR(ret);
305 }
306 
307 static struct ib_uobject *alloc_begin_fd_uobject(const struct uverbs_obj_type *type,
308 						 struct ib_ucontext *ucontext)
309 {
310 	const struct uverbs_obj_fd_type *fd_type =
311 		container_of(type, struct uverbs_obj_fd_type, type);
312 	int new_fd;
313 	struct ib_uobject *uobj;
314 	struct ib_uobject_file *uobj_file;
315 	struct file *filp;
316 
317 	new_fd = get_unused_fd_flags(O_CLOEXEC);
318 	if (new_fd < 0)
319 		return ERR_PTR(new_fd);
320 
321 	uobj = alloc_uobj(ucontext, type);
322 	if (IS_ERR(uobj)) {
323 		put_unused_fd(new_fd);
324 		return uobj;
325 	}
326 
327 	uobj_file = container_of(uobj, struct ib_uobject_file, uobj);
328 	filp = anon_inode_getfile(fd_type->name,
329 				  fd_type->fops,
330 				  uobj_file,
331 				  fd_type->flags);
332 	if (IS_ERR(filp)) {
333 		put_unused_fd(new_fd);
334 		uverbs_uobject_put(uobj);
335 		return (void *)filp;
336 	}
337 
338 	uobj_file->uobj.id = new_fd;
339 	uobj_file->uobj.object = filp;
340 	uobj_file->ufile = ucontext->ufile;
341 	INIT_LIST_HEAD(&uobj->list);
342 	kref_get(&uobj_file->ufile->ref);
343 
344 	return uobj;
345 }
346 
347 struct ib_uobject *rdma_alloc_begin_uobject(const struct uverbs_obj_type *type,
348 					    struct ib_ucontext *ucontext)
349 {
350 	return type->type_class->alloc_begin(type, ucontext);
351 }
352 
353 static int __must_check remove_commit_idr_uobject(struct ib_uobject *uobj,
354 						  enum rdma_remove_reason why)
355 {
356 	const struct uverbs_obj_idr_type *idr_type =
357 		container_of(uobj->type, struct uverbs_obj_idr_type,
358 			     type);
359 	int ret = idr_type->destroy_object(uobj, why);
360 
361 	/*
362 	 * We can only fail gracefully if the user requested to destroy the
363 	 * object. In the rest of the cases, just remove whatever you can.
364 	 */
365 	if (why == RDMA_REMOVE_DESTROY && ret)
366 		return ret;
367 
368 	ib_rdmacg_uncharge(&uobj->cg_obj, uobj->context->device,
369 			   RDMACG_RESOURCE_HCA_OBJECT);
370 	uverbs_idr_remove_uobj(uobj);
371 
372 	return ret;
373 }
374 
375 static void alloc_abort_fd_uobject(struct ib_uobject *uobj)
376 {
377 	struct ib_uobject_file *uobj_file =
378 		container_of(uobj, struct ib_uobject_file, uobj);
379 	struct file *filp = uobj->object;
380 	int id = uobj_file->uobj.id;
381 
382 	/* Unsuccessful NEW */
383 	fput(filp);
384 	put_unused_fd(id);
385 }
386 
387 static int __must_check remove_commit_fd_uobject(struct ib_uobject *uobj,
388 						 enum rdma_remove_reason why)
389 {
390 	const struct uverbs_obj_fd_type *fd_type =
391 		container_of(uobj->type, struct uverbs_obj_fd_type, type);
392 	struct ib_uobject_file *uobj_file =
393 		container_of(uobj, struct ib_uobject_file, uobj);
394 	int ret = fd_type->context_closed(uobj_file, why);
395 
396 	if (why == RDMA_REMOVE_DESTROY && ret)
397 		return ret;
398 
399 	if (why == RDMA_REMOVE_DURING_CLEANUP) {
400 		alloc_abort_fd_uobject(uobj);
401 		return ret;
402 	}
403 
404 	uobj_file->uobj.context = NULL;
405 	return ret;
406 }
407 
408 static void assert_uverbs_usecnt(struct ib_uobject *uobj, bool exclusive)
409 {
410 #ifdef CONFIG_LOCKDEP
411 	if (exclusive)
412 		WARN_ON(atomic_read(&uobj->usecnt) != -1);
413 	else
414 		WARN_ON(atomic_read(&uobj->usecnt) <= 0);
415 #endif
416 }
417 
418 static int __must_check _rdma_remove_commit_uobject(struct ib_uobject *uobj,
419 						    enum rdma_remove_reason why)
420 {
421 	int ret;
422 	struct ib_ucontext *ucontext = uobj->context;
423 
424 	ret = uobj->type->type_class->remove_commit(uobj, why);
425 	if (ret && why == RDMA_REMOVE_DESTROY) {
426 		/* We couldn't remove the object, so just unlock the uobject */
427 		atomic_set(&uobj->usecnt, 0);
428 		uobj->type->type_class->lookup_put(uobj, true);
429 	} else {
430 		mutex_lock(&ucontext->uobjects_lock);
431 		list_del(&uobj->list);
432 		mutex_unlock(&ucontext->uobjects_lock);
433 		/* put the ref we took when we created the object */
434 		uverbs_uobject_put(uobj);
435 	}
436 
437 	return ret;
438 }
439 
440 /* This is called only for user requested DESTROY reasons */
441 int __must_check rdma_remove_commit_uobject(struct ib_uobject *uobj)
442 {
443 	int ret;
444 	struct ib_ucontext *ucontext = uobj->context;
445 
446 	/* put the ref count we took at lookup_get */
447 	uverbs_uobject_put(uobj);
448 	/* Cleanup is running. Calling this should have been impossible */
449 	if (!down_read_trylock(&ucontext->cleanup_rwsem)) {
450 		WARN(true, "ib_uverbs: Cleanup is running while removing an uobject\n");
451 		return 0;
452 	}
453 	assert_uverbs_usecnt(uobj, true);
454 	ret = _rdma_remove_commit_uobject(uobj, RDMA_REMOVE_DESTROY);
455 
456 	up_read(&ucontext->cleanup_rwsem);
457 	return ret;
458 }
459 
460 static int null_obj_type_class_remove_commit(struct ib_uobject *uobj,
461 					     enum rdma_remove_reason why)
462 {
463 	return 0;
464 }
465 
466 static const struct uverbs_obj_type null_obj_type = {
467 	.type_class = &((const struct uverbs_obj_type_class){
468 			.remove_commit = null_obj_type_class_remove_commit,
469 			/* be cautious */
470 			.needs_kfree_rcu = true}),
471 };
472 
473 int rdma_explicit_destroy(struct ib_uobject *uobject)
474 {
475 	int ret;
476 	struct ib_ucontext *ucontext = uobject->context;
477 
478 	/* Cleanup is running. Calling this should have been impossible */
479 	if (!down_read_trylock(&ucontext->cleanup_rwsem)) {
480 		WARN(true, "ib_uverbs: Cleanup is running while removing an uobject\n");
481 		return 0;
482 	}
483 	assert_uverbs_usecnt(uobject, true);
484 	ret = uobject->type->type_class->remove_commit(uobject,
485 						       RDMA_REMOVE_DESTROY);
486 	if (ret)
487 		goto out;
488 
489 	uobject->type = &null_obj_type;
490 
491 out:
492 	up_read(&ucontext->cleanup_rwsem);
493 	return ret;
494 }
495 
496 static void alloc_commit_idr_uobject(struct ib_uobject *uobj)
497 {
498 	spin_lock(&uobj->context->ufile->idr_lock);
499 	/*
500 	 * We already allocated this IDR with a NULL object, so
501 	 * this shouldn't fail.
502 	 */
503 	WARN_ON(idr_replace(&uobj->context->ufile->idr,
504 			    uobj, uobj->id));
505 	spin_unlock(&uobj->context->ufile->idr_lock);
506 }
507 
508 static void alloc_commit_fd_uobject(struct ib_uobject *uobj)
509 {
510 	struct ib_uobject_file *uobj_file =
511 		container_of(uobj, struct ib_uobject_file, uobj);
512 
513 	fd_install(uobj_file->uobj.id, uobj->object);
514 	/* This shouldn't be used anymore. Use the file object instead */
515 	uobj_file->uobj.id = 0;
516 	/* Get another reference as we export this to the fops */
517 	uverbs_uobject_get(&uobj_file->uobj);
518 }
519 
520 int rdma_alloc_commit_uobject(struct ib_uobject *uobj)
521 {
522 	/* Cleanup is running. Calling this should have been impossible */
523 	if (!down_read_trylock(&uobj->context->cleanup_rwsem)) {
524 		int ret;
525 
526 		WARN(true, "ib_uverbs: Cleanup is running while allocating an uobject\n");
527 		ret = uobj->type->type_class->remove_commit(uobj,
528 							    RDMA_REMOVE_DURING_CLEANUP);
529 		if (ret)
530 			pr_warn("ib_uverbs: cleanup of idr object %d failed\n",
531 				uobj->id);
532 		return ret;
533 	}
534 
535 	/* matches atomic_set(-1) in alloc_uobj */
536 	assert_uverbs_usecnt(uobj, true);
537 	atomic_set(&uobj->usecnt, 0);
538 
539 	mutex_lock(&uobj->context->uobjects_lock);
540 	list_add(&uobj->list, &uobj->context->uobjects);
541 	mutex_unlock(&uobj->context->uobjects_lock);
542 
543 	uobj->type->type_class->alloc_commit(uobj);
544 	up_read(&uobj->context->cleanup_rwsem);
545 
546 	return 0;
547 }
548 
549 static void alloc_abort_idr_uobject(struct ib_uobject *uobj)
550 {
551 	uverbs_idr_remove_uobj(uobj);
552 	ib_rdmacg_uncharge(&uobj->cg_obj, uobj->context->device,
553 			   RDMACG_RESOURCE_HCA_OBJECT);
554 	uverbs_uobject_put(uobj);
555 }
556 
557 void rdma_alloc_abort_uobject(struct ib_uobject *uobj)
558 {
559 	uobj->type->type_class->alloc_abort(uobj);
560 }
561 
562 static void lookup_put_idr_uobject(struct ib_uobject *uobj, bool exclusive)
563 {
564 }
565 
566 static void lookup_put_fd_uobject(struct ib_uobject *uobj, bool exclusive)
567 {
568 	struct file *filp = uobj->object;
569 
570 	WARN_ON(exclusive);
571 	/* This indirectly calls uverbs_close_fd and free the object */
572 	fput(filp);
573 }
574 
575 void rdma_lookup_put_uobject(struct ib_uobject *uobj, bool exclusive)
576 {
577 	assert_uverbs_usecnt(uobj, exclusive);
578 	uobj->type->type_class->lookup_put(uobj, exclusive);
579 	/*
580 	 * In order to unlock an object, either decrease its usecnt for
581 	 * read access or zero it in case of exclusive access. See
582 	 * uverbs_try_lock_object for locking schema information.
583 	 */
584 	if (!exclusive)
585 		atomic_dec(&uobj->usecnt);
586 	else
587 		atomic_set(&uobj->usecnt, 0);
588 
589 	uverbs_uobject_put(uobj);
590 }
591 
592 const struct uverbs_obj_type_class uverbs_idr_class = {
593 	.alloc_begin = alloc_begin_idr_uobject,
594 	.lookup_get = lookup_get_idr_uobject,
595 	.alloc_commit = alloc_commit_idr_uobject,
596 	.alloc_abort = alloc_abort_idr_uobject,
597 	.lookup_put = lookup_put_idr_uobject,
598 	.remove_commit = remove_commit_idr_uobject,
599 	/*
600 	 * When we destroy an object, we first just lock it for WRITE and
601 	 * actually DESTROY it in the finalize stage. So, the problematic
602 	 * scenario is when we just started the finalize stage of the
603 	 * destruction (nothing was executed yet). Now, the other thread
604 	 * fetched the object for READ access, but it didn't lock it yet.
605 	 * The DESTROY thread continues and starts destroying the object.
606 	 * When the other thread continue - without the RCU, it would
607 	 * access freed memory. However, the rcu_read_lock delays the free
608 	 * until the rcu_read_lock of the READ operation quits. Since the
609 	 * exclusive lock of the object is still taken by the DESTROY flow, the
610 	 * READ operation will get -EBUSY and it'll just bail out.
611 	 */
612 	.needs_kfree_rcu = true,
613 };
614 
615 static void _uverbs_close_fd(struct ib_uobject_file *uobj_file)
616 {
617 	struct ib_ucontext *ucontext;
618 	struct ib_uverbs_file *ufile = uobj_file->ufile;
619 	int ret;
620 
621 	mutex_lock(&uobj_file->ufile->cleanup_mutex);
622 
623 	/* uobject was either already cleaned up or is cleaned up right now anyway */
624 	if (!uobj_file->uobj.context ||
625 	    !down_read_trylock(&uobj_file->uobj.context->cleanup_rwsem))
626 		goto unlock;
627 
628 	ucontext = uobj_file->uobj.context;
629 	ret = _rdma_remove_commit_uobject(&uobj_file->uobj, RDMA_REMOVE_CLOSE);
630 	up_read(&ucontext->cleanup_rwsem);
631 	if (ret)
632 		pr_warn("uverbs: unable to clean up uobject file in uverbs_close_fd.\n");
633 unlock:
634 	mutex_unlock(&ufile->cleanup_mutex);
635 }
636 
637 void uverbs_close_fd(struct file *f)
638 {
639 	struct ib_uobject_file *uobj_file = f->private_data;
640 	struct kref *uverbs_file_ref = &uobj_file->ufile->ref;
641 
642 	_uverbs_close_fd(uobj_file);
643 	uverbs_uobject_put(&uobj_file->uobj);
644 	kref_put(uverbs_file_ref, ib_uverbs_release_file);
645 }
646 
647 void uverbs_cleanup_ucontext(struct ib_ucontext *ucontext, bool device_removed)
648 {
649 	enum rdma_remove_reason reason = device_removed ?
650 		RDMA_REMOVE_DRIVER_REMOVE : RDMA_REMOVE_CLOSE;
651 	unsigned int cur_order = 0;
652 
653 	ucontext->cleanup_reason = reason;
654 	/*
655 	 * Waits for all remove_commit and alloc_commit to finish. Logically, We
656 	 * want to hold this forever as the context is going to be destroyed,
657 	 * but we'll release it since it causes a "held lock freed" BUG message.
658 	 */
659 	down_write(&ucontext->cleanup_rwsem);
660 
661 	while (!list_empty(&ucontext->uobjects)) {
662 		struct ib_uobject *obj, *next_obj;
663 		unsigned int next_order = UINT_MAX;
664 
665 		/*
666 		 * This shouldn't run while executing other commands on this
667 		 * context. Thus, the only thing we should take care of is
668 		 * releasing a FD while traversing this list. The FD could be
669 		 * closed and released from the _release fop of this FD.
670 		 * In order to mitigate this, we add a lock.
671 		 * We take and release the lock per order traversal in order
672 		 * to let other threads (which might still use the FDs) chance
673 		 * to run.
674 		 */
675 		mutex_lock(&ucontext->uobjects_lock);
676 		list_for_each_entry_safe(obj, next_obj, &ucontext->uobjects,
677 					 list) {
678 			if (obj->type->destroy_order == cur_order) {
679 				int ret;
680 
681 				/*
682 				 * if we hit this WARN_ON, that means we are
683 				 * racing with a lookup_get.
684 				 */
685 				WARN_ON(uverbs_try_lock_object(obj, true));
686 				ret = obj->type->type_class->remove_commit(obj,
687 									   reason);
688 				list_del(&obj->list);
689 				if (ret)
690 					pr_warn("ib_uverbs: failed to remove uobject id %d order %u\n",
691 						obj->id, cur_order);
692 				/* put the ref we took when we created the object */
693 				uverbs_uobject_put(obj);
694 			} else {
695 				next_order = min(next_order,
696 						 obj->type->destroy_order);
697 			}
698 		}
699 		mutex_unlock(&ucontext->uobjects_lock);
700 		cur_order = next_order;
701 	}
702 	up_write(&ucontext->cleanup_rwsem);
703 }
704 
705 void uverbs_initialize_ucontext(struct ib_ucontext *ucontext)
706 {
707 	ucontext->cleanup_reason = 0;
708 	mutex_init(&ucontext->uobjects_lock);
709 	INIT_LIST_HEAD(&ucontext->uobjects);
710 	init_rwsem(&ucontext->cleanup_rwsem);
711 }
712 
713 const struct uverbs_obj_type_class uverbs_fd_class = {
714 	.alloc_begin = alloc_begin_fd_uobject,
715 	.lookup_get = lookup_get_fd_uobject,
716 	.alloc_commit = alloc_commit_fd_uobject,
717 	.alloc_abort = alloc_abort_fd_uobject,
718 	.lookup_put = lookup_put_fd_uobject,
719 	.remove_commit = remove_commit_fd_uobject,
720 	.needs_kfree_rcu = false,
721 };
722 
723 struct ib_uobject *uverbs_get_uobject_from_context(const struct uverbs_obj_type *type_attrs,
724 						   struct ib_ucontext *ucontext,
725 						   enum uverbs_obj_access access,
726 						   int id)
727 {
728 	switch (access) {
729 	case UVERBS_ACCESS_READ:
730 		return rdma_lookup_get_uobject(type_attrs, ucontext, id, false);
731 	case UVERBS_ACCESS_DESTROY:
732 	case UVERBS_ACCESS_WRITE:
733 		return rdma_lookup_get_uobject(type_attrs, ucontext, id, true);
734 	case UVERBS_ACCESS_NEW:
735 		return rdma_alloc_begin_uobject(type_attrs, ucontext);
736 	default:
737 		WARN_ON(true);
738 		return ERR_PTR(-EOPNOTSUPP);
739 	}
740 }
741 
742 int uverbs_finalize_object(struct ib_uobject *uobj,
743 			   enum uverbs_obj_access access,
744 			   bool commit)
745 {
746 	int ret = 0;
747 
748 	/*
749 	 * refcounts should be handled at the object level and not at the
750 	 * uobject level. Refcounts of the objects themselves are done in
751 	 * handlers.
752 	 */
753 
754 	switch (access) {
755 	case UVERBS_ACCESS_READ:
756 		rdma_lookup_put_uobject(uobj, false);
757 		break;
758 	case UVERBS_ACCESS_WRITE:
759 		rdma_lookup_put_uobject(uobj, true);
760 		break;
761 	case UVERBS_ACCESS_DESTROY:
762 		if (commit)
763 			ret = rdma_remove_commit_uobject(uobj);
764 		else
765 			rdma_lookup_put_uobject(uobj, true);
766 		break;
767 	case UVERBS_ACCESS_NEW:
768 		if (commit)
769 			ret = rdma_alloc_commit_uobject(uobj);
770 		else
771 			rdma_alloc_abort_uobject(uobj);
772 		break;
773 	default:
774 		WARN_ON(true);
775 		ret = -EOPNOTSUPP;
776 	}
777 
778 	return ret;
779 }
780 
781 int uverbs_finalize_objects(struct uverbs_attr_bundle *attrs_bundle,
782 			    struct uverbs_attr_spec_hash * const *spec_hash,
783 			    size_t num,
784 			    bool commit)
785 {
786 	unsigned int i;
787 	int ret = 0;
788 
789 	for (i = 0; i < num; i++) {
790 		struct uverbs_attr_bundle_hash *curr_bundle =
791 			&attrs_bundle->hash[i];
792 		const struct uverbs_attr_spec_hash *curr_spec_bucket =
793 			spec_hash[i];
794 		unsigned int j;
795 
796 		for (j = 0; j < curr_bundle->num_attrs; j++) {
797 			struct uverbs_attr *attr;
798 			const struct uverbs_attr_spec *spec;
799 
800 			if (!uverbs_attr_is_valid_in_hash(curr_bundle, j))
801 				continue;
802 
803 			attr = &curr_bundle->attrs[j];
804 			spec = &curr_spec_bucket->attrs[j];
805 
806 			if (spec->type == UVERBS_ATTR_TYPE_IDR ||
807 			    spec->type == UVERBS_ATTR_TYPE_FD) {
808 				int current_ret;
809 
810 				current_ret = uverbs_finalize_object(attr->obj_attr.uobject,
811 								     spec->obj.access,
812 								     commit);
813 				if (!ret)
814 					ret = current_ret;
815 			}
816 		}
817 	}
818 	return ret;
819 }
820