xref: /linux/drivers/infiniband/ulp/srp/ib_srp.c (revision cc1e6315e83db0e517dd9279050b88adc83a7eba)
1 /*
2  * Copyright (c) 2005 Cisco Systems.  All rights reserved.
3  *
4  * This software is available to you under a choice of one of two
5  * licenses.  You may choose to be licensed under the terms of the GNU
6  * General Public License (GPL) Version 2, available from the file
7  * COPYING in the main directory of this source tree, or the
8  * OpenIB.org BSD license below:
9  *
10  *     Redistribution and use in source and binary forms, with or
11  *     without modification, are permitted provided that the following
12  *     conditions are met:
13  *
14  *      - Redistributions of source code must retain the above
15  *        copyright notice, this list of conditions and the following
16  *        disclaimer.
17  *
18  *      - Redistributions in binary form must reproduce the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer in the documentation and/or other materials
21  *        provided with the distribution.
22  *
23  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30  * SOFTWARE.
31  */
32 
33 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
34 
35 #include <linux/module.h>
36 #include <linux/init.h>
37 #include <linux/slab.h>
38 #include <linux/err.h>
39 #include <linux/string.h>
40 #include <linux/parser.h>
41 #include <linux/random.h>
42 #include <linux/jiffies.h>
43 #include <linux/lockdep.h>
44 #include <linux/inet.h>
45 #include <rdma/ib_cache.h>
46 
47 #include <linux/atomic.h>
48 
49 #include <scsi/scsi.h>
50 #include <scsi/scsi_device.h>
51 #include <scsi/scsi_dbg.h>
52 #include <scsi/scsi_tcq.h>
53 #include <scsi/srp.h>
54 #include <scsi/scsi_transport_srp.h>
55 
56 #include "ib_srp.h"
57 
58 #define DRV_NAME	"ib_srp"
59 #define PFX		DRV_NAME ": "
60 
61 MODULE_AUTHOR("Roland Dreier");
62 MODULE_DESCRIPTION("InfiniBand SCSI RDMA Protocol initiator");
63 MODULE_LICENSE("Dual BSD/GPL");
64 
65 #if !defined(CONFIG_DYNAMIC_DEBUG)
66 #define DEFINE_DYNAMIC_DEBUG_METADATA(name, fmt)
67 #define DYNAMIC_DEBUG_BRANCH(descriptor) false
68 #endif
69 
70 static unsigned int srp_sg_tablesize;
71 static unsigned int cmd_sg_entries;
72 static unsigned int indirect_sg_entries;
73 static bool allow_ext_sg;
74 static bool prefer_fr = true;
75 static bool register_always = true;
76 static bool never_register;
77 static int topspin_workarounds = 1;
78 
79 module_param(srp_sg_tablesize, uint, 0444);
80 MODULE_PARM_DESC(srp_sg_tablesize, "Deprecated name for cmd_sg_entries");
81 
82 module_param(cmd_sg_entries, uint, 0444);
83 MODULE_PARM_DESC(cmd_sg_entries,
84 		 "Default number of gather/scatter entries in the SRP command (default is 12, max 255)");
85 
86 module_param(indirect_sg_entries, uint, 0444);
87 MODULE_PARM_DESC(indirect_sg_entries,
88 		 "Default max number of gather/scatter entries (default is 12, max is " __stringify(SG_MAX_SEGMENTS) ")");
89 
90 module_param(allow_ext_sg, bool, 0444);
91 MODULE_PARM_DESC(allow_ext_sg,
92 		  "Default behavior when there are more than cmd_sg_entries S/G entries after mapping; fails the request when false (default false)");
93 
94 module_param(topspin_workarounds, int, 0444);
95 MODULE_PARM_DESC(topspin_workarounds,
96 		 "Enable workarounds for Topspin/Cisco SRP target bugs if != 0");
97 
98 module_param(prefer_fr, bool, 0444);
99 MODULE_PARM_DESC(prefer_fr,
100 "Whether to use fast registration if both FMR and fast registration are supported");
101 
102 module_param(register_always, bool, 0444);
103 MODULE_PARM_DESC(register_always,
104 		 "Use memory registration even for contiguous memory regions");
105 
106 module_param(never_register, bool, 0444);
107 MODULE_PARM_DESC(never_register, "Never register memory");
108 
109 static const struct kernel_param_ops srp_tmo_ops;
110 
111 static int srp_reconnect_delay = 10;
112 module_param_cb(reconnect_delay, &srp_tmo_ops, &srp_reconnect_delay,
113 		S_IRUGO | S_IWUSR);
114 MODULE_PARM_DESC(reconnect_delay, "Time between successive reconnect attempts");
115 
116 static int srp_fast_io_fail_tmo = 15;
117 module_param_cb(fast_io_fail_tmo, &srp_tmo_ops, &srp_fast_io_fail_tmo,
118 		S_IRUGO | S_IWUSR);
119 MODULE_PARM_DESC(fast_io_fail_tmo,
120 		 "Number of seconds between the observation of a transport"
121 		 " layer error and failing all I/O. \"off\" means that this"
122 		 " functionality is disabled.");
123 
124 static int srp_dev_loss_tmo = 600;
125 module_param_cb(dev_loss_tmo, &srp_tmo_ops, &srp_dev_loss_tmo,
126 		S_IRUGO | S_IWUSR);
127 MODULE_PARM_DESC(dev_loss_tmo,
128 		 "Maximum number of seconds that the SRP transport should"
129 		 " insulate transport layer errors. After this time has been"
130 		 " exceeded the SCSI host is removed. Should be"
131 		 " between 1 and " __stringify(SCSI_DEVICE_BLOCK_MAX_TIMEOUT)
132 		 " if fast_io_fail_tmo has not been set. \"off\" means that"
133 		 " this functionality is disabled.");
134 
135 static unsigned ch_count;
136 module_param(ch_count, uint, 0444);
137 MODULE_PARM_DESC(ch_count,
138 		 "Number of RDMA channels to use for communication with an SRP target. Using more than one channel improves performance if the HCA supports multiple completion vectors. The default value is the minimum of four times the number of online CPU sockets and the number of completion vectors supported by the HCA.");
139 
140 static void srp_add_one(struct ib_device *device);
141 static void srp_remove_one(struct ib_device *device, void *client_data);
142 static void srp_recv_done(struct ib_cq *cq, struct ib_wc *wc);
143 static void srp_handle_qp_err(struct ib_cq *cq, struct ib_wc *wc,
144 		const char *opname);
145 static int srp_ib_cm_handler(struct ib_cm_id *cm_id,
146 			     const struct ib_cm_event *event);
147 static int srp_rdma_cm_handler(struct rdma_cm_id *cm_id,
148 			       struct rdma_cm_event *event);
149 
150 static struct scsi_transport_template *ib_srp_transport_template;
151 static struct workqueue_struct *srp_remove_wq;
152 
153 static struct ib_client srp_client = {
154 	.name   = "srp",
155 	.add    = srp_add_one,
156 	.remove = srp_remove_one
157 };
158 
159 static struct ib_sa_client srp_sa_client;
160 
161 static int srp_tmo_get(char *buffer, const struct kernel_param *kp)
162 {
163 	int tmo = *(int *)kp->arg;
164 
165 	if (tmo >= 0)
166 		return sprintf(buffer, "%d", tmo);
167 	else
168 		return sprintf(buffer, "off");
169 }
170 
171 static int srp_tmo_set(const char *val, const struct kernel_param *kp)
172 {
173 	int tmo, res;
174 
175 	res = srp_parse_tmo(&tmo, val);
176 	if (res)
177 		goto out;
178 
179 	if (kp->arg == &srp_reconnect_delay)
180 		res = srp_tmo_valid(tmo, srp_fast_io_fail_tmo,
181 				    srp_dev_loss_tmo);
182 	else if (kp->arg == &srp_fast_io_fail_tmo)
183 		res = srp_tmo_valid(srp_reconnect_delay, tmo, srp_dev_loss_tmo);
184 	else
185 		res = srp_tmo_valid(srp_reconnect_delay, srp_fast_io_fail_tmo,
186 				    tmo);
187 	if (res)
188 		goto out;
189 	*(int *)kp->arg = tmo;
190 
191 out:
192 	return res;
193 }
194 
195 static const struct kernel_param_ops srp_tmo_ops = {
196 	.get = srp_tmo_get,
197 	.set = srp_tmo_set,
198 };
199 
200 static inline struct srp_target_port *host_to_target(struct Scsi_Host *host)
201 {
202 	return (struct srp_target_port *) host->hostdata;
203 }
204 
205 static const char *srp_target_info(struct Scsi_Host *host)
206 {
207 	return host_to_target(host)->target_name;
208 }
209 
210 static int srp_target_is_topspin(struct srp_target_port *target)
211 {
212 	static const u8 topspin_oui[3] = { 0x00, 0x05, 0xad };
213 	static const u8 cisco_oui[3]   = { 0x00, 0x1b, 0x0d };
214 
215 	return topspin_workarounds &&
216 		(!memcmp(&target->ioc_guid, topspin_oui, sizeof topspin_oui) ||
217 		 !memcmp(&target->ioc_guid, cisco_oui, sizeof cisco_oui));
218 }
219 
220 static struct srp_iu *srp_alloc_iu(struct srp_host *host, size_t size,
221 				   gfp_t gfp_mask,
222 				   enum dma_data_direction direction)
223 {
224 	struct srp_iu *iu;
225 
226 	iu = kmalloc(sizeof *iu, gfp_mask);
227 	if (!iu)
228 		goto out;
229 
230 	iu->buf = kzalloc(size, gfp_mask);
231 	if (!iu->buf)
232 		goto out_free_iu;
233 
234 	iu->dma = ib_dma_map_single(host->srp_dev->dev, iu->buf, size,
235 				    direction);
236 	if (ib_dma_mapping_error(host->srp_dev->dev, iu->dma))
237 		goto out_free_buf;
238 
239 	iu->size      = size;
240 	iu->direction = direction;
241 
242 	return iu;
243 
244 out_free_buf:
245 	kfree(iu->buf);
246 out_free_iu:
247 	kfree(iu);
248 out:
249 	return NULL;
250 }
251 
252 static void srp_free_iu(struct srp_host *host, struct srp_iu *iu)
253 {
254 	if (!iu)
255 		return;
256 
257 	ib_dma_unmap_single(host->srp_dev->dev, iu->dma, iu->size,
258 			    iu->direction);
259 	kfree(iu->buf);
260 	kfree(iu);
261 }
262 
263 static void srp_qp_event(struct ib_event *event, void *context)
264 {
265 	pr_debug("QP event %s (%d)\n",
266 		 ib_event_msg(event->event), event->event);
267 }
268 
269 static int srp_init_ib_qp(struct srp_target_port *target,
270 			  struct ib_qp *qp)
271 {
272 	struct ib_qp_attr *attr;
273 	int ret;
274 
275 	attr = kmalloc(sizeof *attr, GFP_KERNEL);
276 	if (!attr)
277 		return -ENOMEM;
278 
279 	ret = ib_find_cached_pkey(target->srp_host->srp_dev->dev,
280 				  target->srp_host->port,
281 				  be16_to_cpu(target->ib_cm.pkey),
282 				  &attr->pkey_index);
283 	if (ret)
284 		goto out;
285 
286 	attr->qp_state        = IB_QPS_INIT;
287 	attr->qp_access_flags = (IB_ACCESS_REMOTE_READ |
288 				    IB_ACCESS_REMOTE_WRITE);
289 	attr->port_num        = target->srp_host->port;
290 
291 	ret = ib_modify_qp(qp, attr,
292 			   IB_QP_STATE		|
293 			   IB_QP_PKEY_INDEX	|
294 			   IB_QP_ACCESS_FLAGS	|
295 			   IB_QP_PORT);
296 
297 out:
298 	kfree(attr);
299 	return ret;
300 }
301 
302 static int srp_new_ib_cm_id(struct srp_rdma_ch *ch)
303 {
304 	struct srp_target_port *target = ch->target;
305 	struct ib_cm_id *new_cm_id;
306 
307 	new_cm_id = ib_create_cm_id(target->srp_host->srp_dev->dev,
308 				    srp_ib_cm_handler, ch);
309 	if (IS_ERR(new_cm_id))
310 		return PTR_ERR(new_cm_id);
311 
312 	if (ch->ib_cm.cm_id)
313 		ib_destroy_cm_id(ch->ib_cm.cm_id);
314 	ch->ib_cm.cm_id = new_cm_id;
315 	if (rdma_cap_opa_ah(target->srp_host->srp_dev->dev,
316 			    target->srp_host->port))
317 		ch->ib_cm.path.rec_type = SA_PATH_REC_TYPE_OPA;
318 	else
319 		ch->ib_cm.path.rec_type = SA_PATH_REC_TYPE_IB;
320 	ch->ib_cm.path.sgid = target->sgid;
321 	ch->ib_cm.path.dgid = target->ib_cm.orig_dgid;
322 	ch->ib_cm.path.pkey = target->ib_cm.pkey;
323 	ch->ib_cm.path.service_id = target->ib_cm.service_id;
324 
325 	return 0;
326 }
327 
328 static int srp_new_rdma_cm_id(struct srp_rdma_ch *ch)
329 {
330 	struct srp_target_port *target = ch->target;
331 	struct rdma_cm_id *new_cm_id;
332 	int ret;
333 
334 	new_cm_id = rdma_create_id(target->net, srp_rdma_cm_handler, ch,
335 				   RDMA_PS_TCP, IB_QPT_RC);
336 	if (IS_ERR(new_cm_id)) {
337 		ret = PTR_ERR(new_cm_id);
338 		new_cm_id = NULL;
339 		goto out;
340 	}
341 
342 	init_completion(&ch->done);
343 	ret = rdma_resolve_addr(new_cm_id, target->rdma_cm.src_specified ?
344 				(struct sockaddr *)&target->rdma_cm.src : NULL,
345 				(struct sockaddr *)&target->rdma_cm.dst,
346 				SRP_PATH_REC_TIMEOUT_MS);
347 	if (ret) {
348 		pr_err("No route available from %pIS to %pIS (%d)\n",
349 		       &target->rdma_cm.src, &target->rdma_cm.dst, ret);
350 		goto out;
351 	}
352 	ret = wait_for_completion_interruptible(&ch->done);
353 	if (ret < 0)
354 		goto out;
355 
356 	ret = ch->status;
357 	if (ret) {
358 		pr_err("Resolving address %pIS failed (%d)\n",
359 		       &target->rdma_cm.dst, ret);
360 		goto out;
361 	}
362 
363 	swap(ch->rdma_cm.cm_id, new_cm_id);
364 
365 out:
366 	if (new_cm_id)
367 		rdma_destroy_id(new_cm_id);
368 
369 	return ret;
370 }
371 
372 static int srp_new_cm_id(struct srp_rdma_ch *ch)
373 {
374 	struct srp_target_port *target = ch->target;
375 
376 	return target->using_rdma_cm ? srp_new_rdma_cm_id(ch) :
377 		srp_new_ib_cm_id(ch);
378 }
379 
380 static struct ib_fmr_pool *srp_alloc_fmr_pool(struct srp_target_port *target)
381 {
382 	struct srp_device *dev = target->srp_host->srp_dev;
383 	struct ib_fmr_pool_param fmr_param;
384 
385 	memset(&fmr_param, 0, sizeof(fmr_param));
386 	fmr_param.pool_size	    = target->mr_pool_size;
387 	fmr_param.dirty_watermark   = fmr_param.pool_size / 4;
388 	fmr_param.cache		    = 1;
389 	fmr_param.max_pages_per_fmr = dev->max_pages_per_mr;
390 	fmr_param.page_shift	    = ilog2(dev->mr_page_size);
391 	fmr_param.access	    = (IB_ACCESS_LOCAL_WRITE |
392 				       IB_ACCESS_REMOTE_WRITE |
393 				       IB_ACCESS_REMOTE_READ);
394 
395 	return ib_create_fmr_pool(dev->pd, &fmr_param);
396 }
397 
398 /**
399  * srp_destroy_fr_pool() - free the resources owned by a pool
400  * @pool: Fast registration pool to be destroyed.
401  */
402 static void srp_destroy_fr_pool(struct srp_fr_pool *pool)
403 {
404 	int i;
405 	struct srp_fr_desc *d;
406 
407 	if (!pool)
408 		return;
409 
410 	for (i = 0, d = &pool->desc[0]; i < pool->size; i++, d++) {
411 		if (d->mr)
412 			ib_dereg_mr(d->mr);
413 	}
414 	kfree(pool);
415 }
416 
417 /**
418  * srp_create_fr_pool() - allocate and initialize a pool for fast registration
419  * @device:            IB device to allocate fast registration descriptors for.
420  * @pd:                Protection domain associated with the FR descriptors.
421  * @pool_size:         Number of descriptors to allocate.
422  * @max_page_list_len: Maximum fast registration work request page list length.
423  */
424 static struct srp_fr_pool *srp_create_fr_pool(struct ib_device *device,
425 					      struct ib_pd *pd, int pool_size,
426 					      int max_page_list_len)
427 {
428 	struct srp_fr_pool *pool;
429 	struct srp_fr_desc *d;
430 	struct ib_mr *mr;
431 	int i, ret = -EINVAL;
432 	enum ib_mr_type mr_type;
433 
434 	if (pool_size <= 0)
435 		goto err;
436 	ret = -ENOMEM;
437 	pool = kzalloc(sizeof(struct srp_fr_pool) +
438 		       pool_size * sizeof(struct srp_fr_desc), GFP_KERNEL);
439 	if (!pool)
440 		goto err;
441 	pool->size = pool_size;
442 	pool->max_page_list_len = max_page_list_len;
443 	spin_lock_init(&pool->lock);
444 	INIT_LIST_HEAD(&pool->free_list);
445 
446 	if (device->attrs.device_cap_flags & IB_DEVICE_SG_GAPS_REG)
447 		mr_type = IB_MR_TYPE_SG_GAPS;
448 	else
449 		mr_type = IB_MR_TYPE_MEM_REG;
450 
451 	for (i = 0, d = &pool->desc[0]; i < pool->size; i++, d++) {
452 		mr = ib_alloc_mr(pd, mr_type, max_page_list_len);
453 		if (IS_ERR(mr)) {
454 			ret = PTR_ERR(mr);
455 			if (ret == -ENOMEM)
456 				pr_info("%s: ib_alloc_mr() failed. Try to reduce max_cmd_per_lun, max_sect or ch_count\n",
457 					dev_name(&device->dev));
458 			goto destroy_pool;
459 		}
460 		d->mr = mr;
461 		list_add_tail(&d->entry, &pool->free_list);
462 	}
463 
464 out:
465 	return pool;
466 
467 destroy_pool:
468 	srp_destroy_fr_pool(pool);
469 
470 err:
471 	pool = ERR_PTR(ret);
472 	goto out;
473 }
474 
475 /**
476  * srp_fr_pool_get() - obtain a descriptor suitable for fast registration
477  * @pool: Pool to obtain descriptor from.
478  */
479 static struct srp_fr_desc *srp_fr_pool_get(struct srp_fr_pool *pool)
480 {
481 	struct srp_fr_desc *d = NULL;
482 	unsigned long flags;
483 
484 	spin_lock_irqsave(&pool->lock, flags);
485 	if (!list_empty(&pool->free_list)) {
486 		d = list_first_entry(&pool->free_list, typeof(*d), entry);
487 		list_del(&d->entry);
488 	}
489 	spin_unlock_irqrestore(&pool->lock, flags);
490 
491 	return d;
492 }
493 
494 /**
495  * srp_fr_pool_put() - put an FR descriptor back in the free list
496  * @pool: Pool the descriptor was allocated from.
497  * @desc: Pointer to an array of fast registration descriptor pointers.
498  * @n:    Number of descriptors to put back.
499  *
500  * Note: The caller must already have queued an invalidation request for
501  * desc->mr->rkey before calling this function.
502  */
503 static void srp_fr_pool_put(struct srp_fr_pool *pool, struct srp_fr_desc **desc,
504 			    int n)
505 {
506 	unsigned long flags;
507 	int i;
508 
509 	spin_lock_irqsave(&pool->lock, flags);
510 	for (i = 0; i < n; i++)
511 		list_add(&desc[i]->entry, &pool->free_list);
512 	spin_unlock_irqrestore(&pool->lock, flags);
513 }
514 
515 static struct srp_fr_pool *srp_alloc_fr_pool(struct srp_target_port *target)
516 {
517 	struct srp_device *dev = target->srp_host->srp_dev;
518 
519 	return srp_create_fr_pool(dev->dev, dev->pd, target->mr_pool_size,
520 				  dev->max_pages_per_mr);
521 }
522 
523 /**
524  * srp_destroy_qp() - destroy an RDMA queue pair
525  * @ch: SRP RDMA channel.
526  *
527  * Drain the qp before destroying it.  This avoids that the receive
528  * completion handler can access the queue pair while it is
529  * being destroyed.
530  */
531 static void srp_destroy_qp(struct srp_rdma_ch *ch)
532 {
533 	spin_lock_irq(&ch->lock);
534 	ib_process_cq_direct(ch->send_cq, -1);
535 	spin_unlock_irq(&ch->lock);
536 
537 	ib_drain_qp(ch->qp);
538 	ib_destroy_qp(ch->qp);
539 }
540 
541 static int srp_create_ch_ib(struct srp_rdma_ch *ch)
542 {
543 	struct srp_target_port *target = ch->target;
544 	struct srp_device *dev = target->srp_host->srp_dev;
545 	struct ib_qp_init_attr *init_attr;
546 	struct ib_cq *recv_cq, *send_cq;
547 	struct ib_qp *qp;
548 	struct ib_fmr_pool *fmr_pool = NULL;
549 	struct srp_fr_pool *fr_pool = NULL;
550 	const int m = 1 + dev->use_fast_reg * target->mr_per_cmd * 2;
551 	int ret;
552 
553 	init_attr = kzalloc(sizeof *init_attr, GFP_KERNEL);
554 	if (!init_attr)
555 		return -ENOMEM;
556 
557 	/* queue_size + 1 for ib_drain_rq() */
558 	recv_cq = ib_alloc_cq(dev->dev, ch, target->queue_size + 1,
559 				ch->comp_vector, IB_POLL_SOFTIRQ);
560 	if (IS_ERR(recv_cq)) {
561 		ret = PTR_ERR(recv_cq);
562 		goto err;
563 	}
564 
565 	send_cq = ib_alloc_cq(dev->dev, ch, m * target->queue_size,
566 				ch->comp_vector, IB_POLL_DIRECT);
567 	if (IS_ERR(send_cq)) {
568 		ret = PTR_ERR(send_cq);
569 		goto err_recv_cq;
570 	}
571 
572 	init_attr->event_handler       = srp_qp_event;
573 	init_attr->cap.max_send_wr     = m * target->queue_size;
574 	init_attr->cap.max_recv_wr     = target->queue_size + 1;
575 	init_attr->cap.max_recv_sge    = 1;
576 	init_attr->cap.max_send_sge    = 1;
577 	init_attr->sq_sig_type         = IB_SIGNAL_REQ_WR;
578 	init_attr->qp_type             = IB_QPT_RC;
579 	init_attr->send_cq             = send_cq;
580 	init_attr->recv_cq             = recv_cq;
581 
582 	if (target->using_rdma_cm) {
583 		ret = rdma_create_qp(ch->rdma_cm.cm_id, dev->pd, init_attr);
584 		qp = ch->rdma_cm.cm_id->qp;
585 	} else {
586 		qp = ib_create_qp(dev->pd, init_attr);
587 		if (!IS_ERR(qp)) {
588 			ret = srp_init_ib_qp(target, qp);
589 			if (ret)
590 				ib_destroy_qp(qp);
591 		} else {
592 			ret = PTR_ERR(qp);
593 		}
594 	}
595 	if (ret) {
596 		pr_err("QP creation failed for dev %s: %d\n",
597 		       dev_name(&dev->dev->dev), ret);
598 		goto err_send_cq;
599 	}
600 
601 	if (dev->use_fast_reg) {
602 		fr_pool = srp_alloc_fr_pool(target);
603 		if (IS_ERR(fr_pool)) {
604 			ret = PTR_ERR(fr_pool);
605 			shost_printk(KERN_WARNING, target->scsi_host, PFX
606 				     "FR pool allocation failed (%d)\n", ret);
607 			goto err_qp;
608 		}
609 	} else if (dev->use_fmr) {
610 		fmr_pool = srp_alloc_fmr_pool(target);
611 		if (IS_ERR(fmr_pool)) {
612 			ret = PTR_ERR(fmr_pool);
613 			shost_printk(KERN_WARNING, target->scsi_host, PFX
614 				     "FMR pool allocation failed (%d)\n", ret);
615 			goto err_qp;
616 		}
617 	}
618 
619 	if (ch->qp)
620 		srp_destroy_qp(ch);
621 	if (ch->recv_cq)
622 		ib_free_cq(ch->recv_cq);
623 	if (ch->send_cq)
624 		ib_free_cq(ch->send_cq);
625 
626 	ch->qp = qp;
627 	ch->recv_cq = recv_cq;
628 	ch->send_cq = send_cq;
629 
630 	if (dev->use_fast_reg) {
631 		if (ch->fr_pool)
632 			srp_destroy_fr_pool(ch->fr_pool);
633 		ch->fr_pool = fr_pool;
634 	} else if (dev->use_fmr) {
635 		if (ch->fmr_pool)
636 			ib_destroy_fmr_pool(ch->fmr_pool);
637 		ch->fmr_pool = fmr_pool;
638 	}
639 
640 	kfree(init_attr);
641 	return 0;
642 
643 err_qp:
644 	if (target->using_rdma_cm)
645 		rdma_destroy_qp(ch->rdma_cm.cm_id);
646 	else
647 		ib_destroy_qp(qp);
648 
649 err_send_cq:
650 	ib_free_cq(send_cq);
651 
652 err_recv_cq:
653 	ib_free_cq(recv_cq);
654 
655 err:
656 	kfree(init_attr);
657 	return ret;
658 }
659 
660 /*
661  * Note: this function may be called without srp_alloc_iu_bufs() having been
662  * invoked. Hence the ch->[rt]x_ring checks.
663  */
664 static void srp_free_ch_ib(struct srp_target_port *target,
665 			   struct srp_rdma_ch *ch)
666 {
667 	struct srp_device *dev = target->srp_host->srp_dev;
668 	int i;
669 
670 	if (!ch->target)
671 		return;
672 
673 	if (target->using_rdma_cm) {
674 		if (ch->rdma_cm.cm_id) {
675 			rdma_destroy_id(ch->rdma_cm.cm_id);
676 			ch->rdma_cm.cm_id = NULL;
677 		}
678 	} else {
679 		if (ch->ib_cm.cm_id) {
680 			ib_destroy_cm_id(ch->ib_cm.cm_id);
681 			ch->ib_cm.cm_id = NULL;
682 		}
683 	}
684 
685 	/* If srp_new_cm_id() succeeded but srp_create_ch_ib() not, return. */
686 	if (!ch->qp)
687 		return;
688 
689 	if (dev->use_fast_reg) {
690 		if (ch->fr_pool)
691 			srp_destroy_fr_pool(ch->fr_pool);
692 	} else if (dev->use_fmr) {
693 		if (ch->fmr_pool)
694 			ib_destroy_fmr_pool(ch->fmr_pool);
695 	}
696 
697 	srp_destroy_qp(ch);
698 	ib_free_cq(ch->send_cq);
699 	ib_free_cq(ch->recv_cq);
700 
701 	/*
702 	 * Avoid that the SCSI error handler tries to use this channel after
703 	 * it has been freed. The SCSI error handler can namely continue
704 	 * trying to perform recovery actions after scsi_remove_host()
705 	 * returned.
706 	 */
707 	ch->target = NULL;
708 
709 	ch->qp = NULL;
710 	ch->send_cq = ch->recv_cq = NULL;
711 
712 	if (ch->rx_ring) {
713 		for (i = 0; i < target->queue_size; ++i)
714 			srp_free_iu(target->srp_host, ch->rx_ring[i]);
715 		kfree(ch->rx_ring);
716 		ch->rx_ring = NULL;
717 	}
718 	if (ch->tx_ring) {
719 		for (i = 0; i < target->queue_size; ++i)
720 			srp_free_iu(target->srp_host, ch->tx_ring[i]);
721 		kfree(ch->tx_ring);
722 		ch->tx_ring = NULL;
723 	}
724 }
725 
726 static void srp_path_rec_completion(int status,
727 				    struct sa_path_rec *pathrec,
728 				    void *ch_ptr)
729 {
730 	struct srp_rdma_ch *ch = ch_ptr;
731 	struct srp_target_port *target = ch->target;
732 
733 	ch->status = status;
734 	if (status)
735 		shost_printk(KERN_ERR, target->scsi_host,
736 			     PFX "Got failed path rec status %d\n", status);
737 	else
738 		ch->ib_cm.path = *pathrec;
739 	complete(&ch->done);
740 }
741 
742 static int srp_ib_lookup_path(struct srp_rdma_ch *ch)
743 {
744 	struct srp_target_port *target = ch->target;
745 	int ret;
746 
747 	ch->ib_cm.path.numb_path = 1;
748 
749 	init_completion(&ch->done);
750 
751 	ch->ib_cm.path_query_id = ib_sa_path_rec_get(&srp_sa_client,
752 					       target->srp_host->srp_dev->dev,
753 					       target->srp_host->port,
754 					       &ch->ib_cm.path,
755 					       IB_SA_PATH_REC_SERVICE_ID |
756 					       IB_SA_PATH_REC_DGID	 |
757 					       IB_SA_PATH_REC_SGID	 |
758 					       IB_SA_PATH_REC_NUMB_PATH	 |
759 					       IB_SA_PATH_REC_PKEY,
760 					       SRP_PATH_REC_TIMEOUT_MS,
761 					       GFP_KERNEL,
762 					       srp_path_rec_completion,
763 					       ch, &ch->ib_cm.path_query);
764 	if (ch->ib_cm.path_query_id < 0)
765 		return ch->ib_cm.path_query_id;
766 
767 	ret = wait_for_completion_interruptible(&ch->done);
768 	if (ret < 0)
769 		return ret;
770 
771 	if (ch->status < 0)
772 		shost_printk(KERN_WARNING, target->scsi_host,
773 			     PFX "Path record query failed: sgid %pI6, dgid %pI6, pkey %#04x, service_id %#16llx\n",
774 			     ch->ib_cm.path.sgid.raw, ch->ib_cm.path.dgid.raw,
775 			     be16_to_cpu(target->ib_cm.pkey),
776 			     be64_to_cpu(target->ib_cm.service_id));
777 
778 	return ch->status;
779 }
780 
781 static int srp_rdma_lookup_path(struct srp_rdma_ch *ch)
782 {
783 	struct srp_target_port *target = ch->target;
784 	int ret;
785 
786 	init_completion(&ch->done);
787 
788 	ret = rdma_resolve_route(ch->rdma_cm.cm_id, SRP_PATH_REC_TIMEOUT_MS);
789 	if (ret)
790 		return ret;
791 
792 	wait_for_completion_interruptible(&ch->done);
793 
794 	if (ch->status != 0)
795 		shost_printk(KERN_WARNING, target->scsi_host,
796 			     PFX "Path resolution failed\n");
797 
798 	return ch->status;
799 }
800 
801 static int srp_lookup_path(struct srp_rdma_ch *ch)
802 {
803 	struct srp_target_port *target = ch->target;
804 
805 	return target->using_rdma_cm ? srp_rdma_lookup_path(ch) :
806 		srp_ib_lookup_path(ch);
807 }
808 
809 static u8 srp_get_subnet_timeout(struct srp_host *host)
810 {
811 	struct ib_port_attr attr;
812 	int ret;
813 	u8 subnet_timeout = 18;
814 
815 	ret = ib_query_port(host->srp_dev->dev, host->port, &attr);
816 	if (ret == 0)
817 		subnet_timeout = attr.subnet_timeout;
818 
819 	if (unlikely(subnet_timeout < 15))
820 		pr_warn("%s: subnet timeout %d may cause SRP login to fail.\n",
821 			dev_name(&host->srp_dev->dev->dev), subnet_timeout);
822 
823 	return subnet_timeout;
824 }
825 
826 static int srp_send_req(struct srp_rdma_ch *ch, bool multich)
827 {
828 	struct srp_target_port *target = ch->target;
829 	struct {
830 		struct rdma_conn_param	  rdma_param;
831 		struct srp_login_req_rdma rdma_req;
832 		struct ib_cm_req_param	  ib_param;
833 		struct srp_login_req	  ib_req;
834 	} *req = NULL;
835 	char *ipi, *tpi;
836 	int status;
837 
838 	req = kzalloc(sizeof *req, GFP_KERNEL);
839 	if (!req)
840 		return -ENOMEM;
841 
842 	req->ib_param.flow_control = 1;
843 	req->ib_param.retry_count = target->tl_retry_count;
844 
845 	/*
846 	 * Pick some arbitrary defaults here; we could make these
847 	 * module parameters if anyone cared about setting them.
848 	 */
849 	req->ib_param.responder_resources = 4;
850 	req->ib_param.rnr_retry_count = 7;
851 	req->ib_param.max_cm_retries = 15;
852 
853 	req->ib_req.opcode = SRP_LOGIN_REQ;
854 	req->ib_req.tag = 0;
855 	req->ib_req.req_it_iu_len = cpu_to_be32(target->max_iu_len);
856 	req->ib_req.req_buf_fmt	= cpu_to_be16(SRP_BUF_FORMAT_DIRECT |
857 					      SRP_BUF_FORMAT_INDIRECT);
858 	req->ib_req.req_flags = (multich ? SRP_MULTICHAN_MULTI :
859 				 SRP_MULTICHAN_SINGLE);
860 
861 	if (target->using_rdma_cm) {
862 		req->rdma_param.flow_control = req->ib_param.flow_control;
863 		req->rdma_param.responder_resources =
864 			req->ib_param.responder_resources;
865 		req->rdma_param.initiator_depth = req->ib_param.initiator_depth;
866 		req->rdma_param.retry_count = req->ib_param.retry_count;
867 		req->rdma_param.rnr_retry_count = req->ib_param.rnr_retry_count;
868 		req->rdma_param.private_data = &req->rdma_req;
869 		req->rdma_param.private_data_len = sizeof(req->rdma_req);
870 
871 		req->rdma_req.opcode = req->ib_req.opcode;
872 		req->rdma_req.tag = req->ib_req.tag;
873 		req->rdma_req.req_it_iu_len = req->ib_req.req_it_iu_len;
874 		req->rdma_req.req_buf_fmt = req->ib_req.req_buf_fmt;
875 		req->rdma_req.req_flags	= req->ib_req.req_flags;
876 
877 		ipi = req->rdma_req.initiator_port_id;
878 		tpi = req->rdma_req.target_port_id;
879 	} else {
880 		u8 subnet_timeout;
881 
882 		subnet_timeout = srp_get_subnet_timeout(target->srp_host);
883 
884 		req->ib_param.primary_path = &ch->ib_cm.path;
885 		req->ib_param.alternate_path = NULL;
886 		req->ib_param.service_id = target->ib_cm.service_id;
887 		get_random_bytes(&req->ib_param.starting_psn, 4);
888 		req->ib_param.starting_psn &= 0xffffff;
889 		req->ib_param.qp_num = ch->qp->qp_num;
890 		req->ib_param.qp_type = ch->qp->qp_type;
891 		req->ib_param.local_cm_response_timeout = subnet_timeout + 2;
892 		req->ib_param.remote_cm_response_timeout = subnet_timeout + 2;
893 		req->ib_param.private_data = &req->ib_req;
894 		req->ib_param.private_data_len = sizeof(req->ib_req);
895 
896 		ipi = req->ib_req.initiator_port_id;
897 		tpi = req->ib_req.target_port_id;
898 	}
899 
900 	/*
901 	 * In the published SRP specification (draft rev. 16a), the
902 	 * port identifier format is 8 bytes of ID extension followed
903 	 * by 8 bytes of GUID.  Older drafts put the two halves in the
904 	 * opposite order, so that the GUID comes first.
905 	 *
906 	 * Targets conforming to these obsolete drafts can be
907 	 * recognized by the I/O Class they report.
908 	 */
909 	if (target->io_class == SRP_REV10_IB_IO_CLASS) {
910 		memcpy(ipi,     &target->sgid.global.interface_id, 8);
911 		memcpy(ipi + 8, &target->initiator_ext, 8);
912 		memcpy(tpi,     &target->ioc_guid, 8);
913 		memcpy(tpi + 8, &target->id_ext, 8);
914 	} else {
915 		memcpy(ipi,     &target->initiator_ext, 8);
916 		memcpy(ipi + 8, &target->sgid.global.interface_id, 8);
917 		memcpy(tpi,     &target->id_ext, 8);
918 		memcpy(tpi + 8, &target->ioc_guid, 8);
919 	}
920 
921 	/*
922 	 * Topspin/Cisco SRP targets will reject our login unless we
923 	 * zero out the first 8 bytes of our initiator port ID and set
924 	 * the second 8 bytes to the local node GUID.
925 	 */
926 	if (srp_target_is_topspin(target)) {
927 		shost_printk(KERN_DEBUG, target->scsi_host,
928 			     PFX "Topspin/Cisco initiator port ID workaround "
929 			     "activated for target GUID %016llx\n",
930 			     be64_to_cpu(target->ioc_guid));
931 		memset(ipi, 0, 8);
932 		memcpy(ipi + 8, &target->srp_host->srp_dev->dev->node_guid, 8);
933 	}
934 
935 	if (target->using_rdma_cm)
936 		status = rdma_connect(ch->rdma_cm.cm_id, &req->rdma_param);
937 	else
938 		status = ib_send_cm_req(ch->ib_cm.cm_id, &req->ib_param);
939 
940 	kfree(req);
941 
942 	return status;
943 }
944 
945 static bool srp_queue_remove_work(struct srp_target_port *target)
946 {
947 	bool changed = false;
948 
949 	spin_lock_irq(&target->lock);
950 	if (target->state != SRP_TARGET_REMOVED) {
951 		target->state = SRP_TARGET_REMOVED;
952 		changed = true;
953 	}
954 	spin_unlock_irq(&target->lock);
955 
956 	if (changed)
957 		queue_work(srp_remove_wq, &target->remove_work);
958 
959 	return changed;
960 }
961 
962 static void srp_disconnect_target(struct srp_target_port *target)
963 {
964 	struct srp_rdma_ch *ch;
965 	int i, ret;
966 
967 	/* XXX should send SRP_I_LOGOUT request */
968 
969 	for (i = 0; i < target->ch_count; i++) {
970 		ch = &target->ch[i];
971 		ch->connected = false;
972 		ret = 0;
973 		if (target->using_rdma_cm) {
974 			if (ch->rdma_cm.cm_id)
975 				rdma_disconnect(ch->rdma_cm.cm_id);
976 		} else {
977 			if (ch->ib_cm.cm_id)
978 				ret = ib_send_cm_dreq(ch->ib_cm.cm_id,
979 						      NULL, 0);
980 		}
981 		if (ret < 0) {
982 			shost_printk(KERN_DEBUG, target->scsi_host,
983 				     PFX "Sending CM DREQ failed\n");
984 		}
985 	}
986 }
987 
988 static void srp_free_req_data(struct srp_target_port *target,
989 			      struct srp_rdma_ch *ch)
990 {
991 	struct srp_device *dev = target->srp_host->srp_dev;
992 	struct ib_device *ibdev = dev->dev;
993 	struct srp_request *req;
994 	int i;
995 
996 	if (!ch->req_ring)
997 		return;
998 
999 	for (i = 0; i < target->req_ring_size; ++i) {
1000 		req = &ch->req_ring[i];
1001 		if (dev->use_fast_reg) {
1002 			kfree(req->fr_list);
1003 		} else {
1004 			kfree(req->fmr_list);
1005 			kfree(req->map_page);
1006 		}
1007 		if (req->indirect_dma_addr) {
1008 			ib_dma_unmap_single(ibdev, req->indirect_dma_addr,
1009 					    target->indirect_size,
1010 					    DMA_TO_DEVICE);
1011 		}
1012 		kfree(req->indirect_desc);
1013 	}
1014 
1015 	kfree(ch->req_ring);
1016 	ch->req_ring = NULL;
1017 }
1018 
1019 static int srp_alloc_req_data(struct srp_rdma_ch *ch)
1020 {
1021 	struct srp_target_port *target = ch->target;
1022 	struct srp_device *srp_dev = target->srp_host->srp_dev;
1023 	struct ib_device *ibdev = srp_dev->dev;
1024 	struct srp_request *req;
1025 	void *mr_list;
1026 	dma_addr_t dma_addr;
1027 	int i, ret = -ENOMEM;
1028 
1029 	ch->req_ring = kcalloc(target->req_ring_size, sizeof(*ch->req_ring),
1030 			       GFP_KERNEL);
1031 	if (!ch->req_ring)
1032 		goto out;
1033 
1034 	for (i = 0; i < target->req_ring_size; ++i) {
1035 		req = &ch->req_ring[i];
1036 		mr_list = kmalloc_array(target->mr_per_cmd, sizeof(void *),
1037 					GFP_KERNEL);
1038 		if (!mr_list)
1039 			goto out;
1040 		if (srp_dev->use_fast_reg) {
1041 			req->fr_list = mr_list;
1042 		} else {
1043 			req->fmr_list = mr_list;
1044 			req->map_page = kmalloc_array(srp_dev->max_pages_per_mr,
1045 						      sizeof(void *),
1046 						      GFP_KERNEL);
1047 			if (!req->map_page)
1048 				goto out;
1049 		}
1050 		req->indirect_desc = kmalloc(target->indirect_size, GFP_KERNEL);
1051 		if (!req->indirect_desc)
1052 			goto out;
1053 
1054 		dma_addr = ib_dma_map_single(ibdev, req->indirect_desc,
1055 					     target->indirect_size,
1056 					     DMA_TO_DEVICE);
1057 		if (ib_dma_mapping_error(ibdev, dma_addr))
1058 			goto out;
1059 
1060 		req->indirect_dma_addr = dma_addr;
1061 	}
1062 	ret = 0;
1063 
1064 out:
1065 	return ret;
1066 }
1067 
1068 /**
1069  * srp_del_scsi_host_attr() - Remove attributes defined in the host template.
1070  * @shost: SCSI host whose attributes to remove from sysfs.
1071  *
1072  * Note: Any attributes defined in the host template and that did not exist
1073  * before invocation of this function will be ignored.
1074  */
1075 static void srp_del_scsi_host_attr(struct Scsi_Host *shost)
1076 {
1077 	struct device_attribute **attr;
1078 
1079 	for (attr = shost->hostt->shost_attrs; attr && *attr; ++attr)
1080 		device_remove_file(&shost->shost_dev, *attr);
1081 }
1082 
1083 static void srp_remove_target(struct srp_target_port *target)
1084 {
1085 	struct srp_rdma_ch *ch;
1086 	int i;
1087 
1088 	WARN_ON_ONCE(target->state != SRP_TARGET_REMOVED);
1089 
1090 	srp_del_scsi_host_attr(target->scsi_host);
1091 	srp_rport_get(target->rport);
1092 	srp_remove_host(target->scsi_host);
1093 	scsi_remove_host(target->scsi_host);
1094 	srp_stop_rport_timers(target->rport);
1095 	srp_disconnect_target(target);
1096 	kobj_ns_drop(KOBJ_NS_TYPE_NET, target->net);
1097 	for (i = 0; i < target->ch_count; i++) {
1098 		ch = &target->ch[i];
1099 		srp_free_ch_ib(target, ch);
1100 	}
1101 	cancel_work_sync(&target->tl_err_work);
1102 	srp_rport_put(target->rport);
1103 	for (i = 0; i < target->ch_count; i++) {
1104 		ch = &target->ch[i];
1105 		srp_free_req_data(target, ch);
1106 	}
1107 	kfree(target->ch);
1108 	target->ch = NULL;
1109 
1110 	spin_lock(&target->srp_host->target_lock);
1111 	list_del(&target->list);
1112 	spin_unlock(&target->srp_host->target_lock);
1113 
1114 	scsi_host_put(target->scsi_host);
1115 }
1116 
1117 static void srp_remove_work(struct work_struct *work)
1118 {
1119 	struct srp_target_port *target =
1120 		container_of(work, struct srp_target_port, remove_work);
1121 
1122 	WARN_ON_ONCE(target->state != SRP_TARGET_REMOVED);
1123 
1124 	srp_remove_target(target);
1125 }
1126 
1127 static void srp_rport_delete(struct srp_rport *rport)
1128 {
1129 	struct srp_target_port *target = rport->lld_data;
1130 
1131 	srp_queue_remove_work(target);
1132 }
1133 
1134 /**
1135  * srp_connected_ch() - number of connected channels
1136  * @target: SRP target port.
1137  */
1138 static int srp_connected_ch(struct srp_target_port *target)
1139 {
1140 	int i, c = 0;
1141 
1142 	for (i = 0; i < target->ch_count; i++)
1143 		c += target->ch[i].connected;
1144 
1145 	return c;
1146 }
1147 
1148 static int srp_connect_ch(struct srp_rdma_ch *ch, bool multich)
1149 {
1150 	struct srp_target_port *target = ch->target;
1151 	int ret;
1152 
1153 	WARN_ON_ONCE(!multich && srp_connected_ch(target) > 0);
1154 
1155 	ret = srp_lookup_path(ch);
1156 	if (ret)
1157 		goto out;
1158 
1159 	while (1) {
1160 		init_completion(&ch->done);
1161 		ret = srp_send_req(ch, multich);
1162 		if (ret)
1163 			goto out;
1164 		ret = wait_for_completion_interruptible(&ch->done);
1165 		if (ret < 0)
1166 			goto out;
1167 
1168 		/*
1169 		 * The CM event handling code will set status to
1170 		 * SRP_PORT_REDIRECT if we get a port redirect REJ
1171 		 * back, or SRP_DLID_REDIRECT if we get a lid/qp
1172 		 * redirect REJ back.
1173 		 */
1174 		ret = ch->status;
1175 		switch (ret) {
1176 		case 0:
1177 			ch->connected = true;
1178 			goto out;
1179 
1180 		case SRP_PORT_REDIRECT:
1181 			ret = srp_lookup_path(ch);
1182 			if (ret)
1183 				goto out;
1184 			break;
1185 
1186 		case SRP_DLID_REDIRECT:
1187 			break;
1188 
1189 		case SRP_STALE_CONN:
1190 			shost_printk(KERN_ERR, target->scsi_host, PFX
1191 				     "giving up on stale connection\n");
1192 			ret = -ECONNRESET;
1193 			goto out;
1194 
1195 		default:
1196 			goto out;
1197 		}
1198 	}
1199 
1200 out:
1201 	return ret <= 0 ? ret : -ENODEV;
1202 }
1203 
1204 static void srp_inv_rkey_err_done(struct ib_cq *cq, struct ib_wc *wc)
1205 {
1206 	srp_handle_qp_err(cq, wc, "INV RKEY");
1207 }
1208 
1209 static int srp_inv_rkey(struct srp_request *req, struct srp_rdma_ch *ch,
1210 		u32 rkey)
1211 {
1212 	struct ib_send_wr wr = {
1213 		.opcode		    = IB_WR_LOCAL_INV,
1214 		.next		    = NULL,
1215 		.num_sge	    = 0,
1216 		.send_flags	    = 0,
1217 		.ex.invalidate_rkey = rkey,
1218 	};
1219 
1220 	wr.wr_cqe = &req->reg_cqe;
1221 	req->reg_cqe.done = srp_inv_rkey_err_done;
1222 	return ib_post_send(ch->qp, &wr, NULL);
1223 }
1224 
1225 static void srp_unmap_data(struct scsi_cmnd *scmnd,
1226 			   struct srp_rdma_ch *ch,
1227 			   struct srp_request *req)
1228 {
1229 	struct srp_target_port *target = ch->target;
1230 	struct srp_device *dev = target->srp_host->srp_dev;
1231 	struct ib_device *ibdev = dev->dev;
1232 	int i, res;
1233 
1234 	if (!scsi_sglist(scmnd) ||
1235 	    (scmnd->sc_data_direction != DMA_TO_DEVICE &&
1236 	     scmnd->sc_data_direction != DMA_FROM_DEVICE))
1237 		return;
1238 
1239 	if (dev->use_fast_reg) {
1240 		struct srp_fr_desc **pfr;
1241 
1242 		for (i = req->nmdesc, pfr = req->fr_list; i > 0; i--, pfr++) {
1243 			res = srp_inv_rkey(req, ch, (*pfr)->mr->rkey);
1244 			if (res < 0) {
1245 				shost_printk(KERN_ERR, target->scsi_host, PFX
1246 				  "Queueing INV WR for rkey %#x failed (%d)\n",
1247 				  (*pfr)->mr->rkey, res);
1248 				queue_work(system_long_wq,
1249 					   &target->tl_err_work);
1250 			}
1251 		}
1252 		if (req->nmdesc)
1253 			srp_fr_pool_put(ch->fr_pool, req->fr_list,
1254 					req->nmdesc);
1255 	} else if (dev->use_fmr) {
1256 		struct ib_pool_fmr **pfmr;
1257 
1258 		for (i = req->nmdesc, pfmr = req->fmr_list; i > 0; i--, pfmr++)
1259 			ib_fmr_pool_unmap(*pfmr);
1260 	}
1261 
1262 	ib_dma_unmap_sg(ibdev, scsi_sglist(scmnd), scsi_sg_count(scmnd),
1263 			scmnd->sc_data_direction);
1264 }
1265 
1266 /**
1267  * srp_claim_req - Take ownership of the scmnd associated with a request.
1268  * @ch: SRP RDMA channel.
1269  * @req: SRP request.
1270  * @sdev: If not NULL, only take ownership for this SCSI device.
1271  * @scmnd: If NULL, take ownership of @req->scmnd. If not NULL, only take
1272  *         ownership of @req->scmnd if it equals @scmnd.
1273  *
1274  * Return value:
1275  * Either NULL or a pointer to the SCSI command the caller became owner of.
1276  */
1277 static struct scsi_cmnd *srp_claim_req(struct srp_rdma_ch *ch,
1278 				       struct srp_request *req,
1279 				       struct scsi_device *sdev,
1280 				       struct scsi_cmnd *scmnd)
1281 {
1282 	unsigned long flags;
1283 
1284 	spin_lock_irqsave(&ch->lock, flags);
1285 	if (req->scmnd &&
1286 	    (!sdev || req->scmnd->device == sdev) &&
1287 	    (!scmnd || req->scmnd == scmnd)) {
1288 		scmnd = req->scmnd;
1289 		req->scmnd = NULL;
1290 	} else {
1291 		scmnd = NULL;
1292 	}
1293 	spin_unlock_irqrestore(&ch->lock, flags);
1294 
1295 	return scmnd;
1296 }
1297 
1298 /**
1299  * srp_free_req() - Unmap data and adjust ch->req_lim.
1300  * @ch:     SRP RDMA channel.
1301  * @req:    Request to be freed.
1302  * @scmnd:  SCSI command associated with @req.
1303  * @req_lim_delta: Amount to be added to @target->req_lim.
1304  */
1305 static void srp_free_req(struct srp_rdma_ch *ch, struct srp_request *req,
1306 			 struct scsi_cmnd *scmnd, s32 req_lim_delta)
1307 {
1308 	unsigned long flags;
1309 
1310 	srp_unmap_data(scmnd, ch, req);
1311 
1312 	spin_lock_irqsave(&ch->lock, flags);
1313 	ch->req_lim += req_lim_delta;
1314 	spin_unlock_irqrestore(&ch->lock, flags);
1315 }
1316 
1317 static void srp_finish_req(struct srp_rdma_ch *ch, struct srp_request *req,
1318 			   struct scsi_device *sdev, int result)
1319 {
1320 	struct scsi_cmnd *scmnd = srp_claim_req(ch, req, sdev, NULL);
1321 
1322 	if (scmnd) {
1323 		srp_free_req(ch, req, scmnd, 0);
1324 		scmnd->result = result;
1325 		scmnd->scsi_done(scmnd);
1326 	}
1327 }
1328 
1329 static void srp_terminate_io(struct srp_rport *rport)
1330 {
1331 	struct srp_target_port *target = rport->lld_data;
1332 	struct srp_rdma_ch *ch;
1333 	struct Scsi_Host *shost = target->scsi_host;
1334 	struct scsi_device *sdev;
1335 	int i, j;
1336 
1337 	/*
1338 	 * Invoking srp_terminate_io() while srp_queuecommand() is running
1339 	 * is not safe. Hence the warning statement below.
1340 	 */
1341 	shost_for_each_device(sdev, shost)
1342 		WARN_ON_ONCE(sdev->request_queue->request_fn_active);
1343 
1344 	for (i = 0; i < target->ch_count; i++) {
1345 		ch = &target->ch[i];
1346 
1347 		for (j = 0; j < target->req_ring_size; ++j) {
1348 			struct srp_request *req = &ch->req_ring[j];
1349 
1350 			srp_finish_req(ch, req, NULL,
1351 				       DID_TRANSPORT_FAILFAST << 16);
1352 		}
1353 	}
1354 }
1355 
1356 /*
1357  * It is up to the caller to ensure that srp_rport_reconnect() calls are
1358  * serialized and that no concurrent srp_queuecommand(), srp_abort(),
1359  * srp_reset_device() or srp_reset_host() calls will occur while this function
1360  * is in progress. One way to realize that is not to call this function
1361  * directly but to call srp_reconnect_rport() instead since that last function
1362  * serializes calls of this function via rport->mutex and also blocks
1363  * srp_queuecommand() calls before invoking this function.
1364  */
1365 static int srp_rport_reconnect(struct srp_rport *rport)
1366 {
1367 	struct srp_target_port *target = rport->lld_data;
1368 	struct srp_rdma_ch *ch;
1369 	int i, j, ret = 0;
1370 	bool multich = false;
1371 
1372 	srp_disconnect_target(target);
1373 
1374 	if (target->state == SRP_TARGET_SCANNING)
1375 		return -ENODEV;
1376 
1377 	/*
1378 	 * Now get a new local CM ID so that we avoid confusing the target in
1379 	 * case things are really fouled up. Doing so also ensures that all CM
1380 	 * callbacks will have finished before a new QP is allocated.
1381 	 */
1382 	for (i = 0; i < target->ch_count; i++) {
1383 		ch = &target->ch[i];
1384 		ret += srp_new_cm_id(ch);
1385 	}
1386 	for (i = 0; i < target->ch_count; i++) {
1387 		ch = &target->ch[i];
1388 		for (j = 0; j < target->req_ring_size; ++j) {
1389 			struct srp_request *req = &ch->req_ring[j];
1390 
1391 			srp_finish_req(ch, req, NULL, DID_RESET << 16);
1392 		}
1393 	}
1394 	for (i = 0; i < target->ch_count; i++) {
1395 		ch = &target->ch[i];
1396 		/*
1397 		 * Whether or not creating a new CM ID succeeded, create a new
1398 		 * QP. This guarantees that all completion callback function
1399 		 * invocations have finished before request resetting starts.
1400 		 */
1401 		ret += srp_create_ch_ib(ch);
1402 
1403 		INIT_LIST_HEAD(&ch->free_tx);
1404 		for (j = 0; j < target->queue_size; ++j)
1405 			list_add(&ch->tx_ring[j]->list, &ch->free_tx);
1406 	}
1407 
1408 	target->qp_in_error = false;
1409 
1410 	for (i = 0; i < target->ch_count; i++) {
1411 		ch = &target->ch[i];
1412 		if (ret)
1413 			break;
1414 		ret = srp_connect_ch(ch, multich);
1415 		multich = true;
1416 	}
1417 
1418 	if (ret == 0)
1419 		shost_printk(KERN_INFO, target->scsi_host,
1420 			     PFX "reconnect succeeded\n");
1421 
1422 	return ret;
1423 }
1424 
1425 static void srp_map_desc(struct srp_map_state *state, dma_addr_t dma_addr,
1426 			 unsigned int dma_len, u32 rkey)
1427 {
1428 	struct srp_direct_buf *desc = state->desc;
1429 
1430 	WARN_ON_ONCE(!dma_len);
1431 
1432 	desc->va = cpu_to_be64(dma_addr);
1433 	desc->key = cpu_to_be32(rkey);
1434 	desc->len = cpu_to_be32(dma_len);
1435 
1436 	state->total_len += dma_len;
1437 	state->desc++;
1438 	state->ndesc++;
1439 }
1440 
1441 static int srp_map_finish_fmr(struct srp_map_state *state,
1442 			      struct srp_rdma_ch *ch)
1443 {
1444 	struct srp_target_port *target = ch->target;
1445 	struct srp_device *dev = target->srp_host->srp_dev;
1446 	struct ib_pool_fmr *fmr;
1447 	u64 io_addr = 0;
1448 
1449 	if (state->fmr.next >= state->fmr.end) {
1450 		shost_printk(KERN_ERR, ch->target->scsi_host,
1451 			     PFX "Out of MRs (mr_per_cmd = %d)\n",
1452 			     ch->target->mr_per_cmd);
1453 		return -ENOMEM;
1454 	}
1455 
1456 	WARN_ON_ONCE(!dev->use_fmr);
1457 
1458 	if (state->npages == 0)
1459 		return 0;
1460 
1461 	if (state->npages == 1 && target->global_rkey) {
1462 		srp_map_desc(state, state->base_dma_addr, state->dma_len,
1463 			     target->global_rkey);
1464 		goto reset_state;
1465 	}
1466 
1467 	fmr = ib_fmr_pool_map_phys(ch->fmr_pool, state->pages,
1468 				   state->npages, io_addr);
1469 	if (IS_ERR(fmr))
1470 		return PTR_ERR(fmr);
1471 
1472 	*state->fmr.next++ = fmr;
1473 	state->nmdesc++;
1474 
1475 	srp_map_desc(state, state->base_dma_addr & ~dev->mr_page_mask,
1476 		     state->dma_len, fmr->fmr->rkey);
1477 
1478 reset_state:
1479 	state->npages = 0;
1480 	state->dma_len = 0;
1481 
1482 	return 0;
1483 }
1484 
1485 static void srp_reg_mr_err_done(struct ib_cq *cq, struct ib_wc *wc)
1486 {
1487 	srp_handle_qp_err(cq, wc, "FAST REG");
1488 }
1489 
1490 /*
1491  * Map up to sg_nents elements of state->sg where *sg_offset_p is the offset
1492  * where to start in the first element. If sg_offset_p != NULL then
1493  * *sg_offset_p is updated to the offset in state->sg[retval] of the first
1494  * byte that has not yet been mapped.
1495  */
1496 static int srp_map_finish_fr(struct srp_map_state *state,
1497 			     struct srp_request *req,
1498 			     struct srp_rdma_ch *ch, int sg_nents,
1499 			     unsigned int *sg_offset_p)
1500 {
1501 	struct srp_target_port *target = ch->target;
1502 	struct srp_device *dev = target->srp_host->srp_dev;
1503 	struct ib_reg_wr wr;
1504 	struct srp_fr_desc *desc;
1505 	u32 rkey;
1506 	int n, err;
1507 
1508 	if (state->fr.next >= state->fr.end) {
1509 		shost_printk(KERN_ERR, ch->target->scsi_host,
1510 			     PFX "Out of MRs (mr_per_cmd = %d)\n",
1511 			     ch->target->mr_per_cmd);
1512 		return -ENOMEM;
1513 	}
1514 
1515 	WARN_ON_ONCE(!dev->use_fast_reg);
1516 
1517 	if (sg_nents == 1 && target->global_rkey) {
1518 		unsigned int sg_offset = sg_offset_p ? *sg_offset_p : 0;
1519 
1520 		srp_map_desc(state, sg_dma_address(state->sg) + sg_offset,
1521 			     sg_dma_len(state->sg) - sg_offset,
1522 			     target->global_rkey);
1523 		if (sg_offset_p)
1524 			*sg_offset_p = 0;
1525 		return 1;
1526 	}
1527 
1528 	desc = srp_fr_pool_get(ch->fr_pool);
1529 	if (!desc)
1530 		return -ENOMEM;
1531 
1532 	rkey = ib_inc_rkey(desc->mr->rkey);
1533 	ib_update_fast_reg_key(desc->mr, rkey);
1534 
1535 	n = ib_map_mr_sg(desc->mr, state->sg, sg_nents, sg_offset_p,
1536 			 dev->mr_page_size);
1537 	if (unlikely(n < 0)) {
1538 		srp_fr_pool_put(ch->fr_pool, &desc, 1);
1539 		pr_debug("%s: ib_map_mr_sg(%d, %d) returned %d.\n",
1540 			 dev_name(&req->scmnd->device->sdev_gendev), sg_nents,
1541 			 sg_offset_p ? *sg_offset_p : -1, n);
1542 		return n;
1543 	}
1544 
1545 	WARN_ON_ONCE(desc->mr->length == 0);
1546 
1547 	req->reg_cqe.done = srp_reg_mr_err_done;
1548 
1549 	wr.wr.next = NULL;
1550 	wr.wr.opcode = IB_WR_REG_MR;
1551 	wr.wr.wr_cqe = &req->reg_cqe;
1552 	wr.wr.num_sge = 0;
1553 	wr.wr.send_flags = 0;
1554 	wr.mr = desc->mr;
1555 	wr.key = desc->mr->rkey;
1556 	wr.access = (IB_ACCESS_LOCAL_WRITE |
1557 		     IB_ACCESS_REMOTE_READ |
1558 		     IB_ACCESS_REMOTE_WRITE);
1559 
1560 	*state->fr.next++ = desc;
1561 	state->nmdesc++;
1562 
1563 	srp_map_desc(state, desc->mr->iova,
1564 		     desc->mr->length, desc->mr->rkey);
1565 
1566 	err = ib_post_send(ch->qp, &wr.wr, NULL);
1567 	if (unlikely(err)) {
1568 		WARN_ON_ONCE(err == -ENOMEM);
1569 		return err;
1570 	}
1571 
1572 	return n;
1573 }
1574 
1575 static int srp_map_sg_entry(struct srp_map_state *state,
1576 			    struct srp_rdma_ch *ch,
1577 			    struct scatterlist *sg)
1578 {
1579 	struct srp_target_port *target = ch->target;
1580 	struct srp_device *dev = target->srp_host->srp_dev;
1581 	struct ib_device *ibdev = dev->dev;
1582 	dma_addr_t dma_addr = ib_sg_dma_address(ibdev, sg);
1583 	unsigned int dma_len = ib_sg_dma_len(ibdev, sg);
1584 	unsigned int len = 0;
1585 	int ret;
1586 
1587 	WARN_ON_ONCE(!dma_len);
1588 
1589 	while (dma_len) {
1590 		unsigned offset = dma_addr & ~dev->mr_page_mask;
1591 
1592 		if (state->npages == dev->max_pages_per_mr ||
1593 		    (state->npages > 0 && offset != 0)) {
1594 			ret = srp_map_finish_fmr(state, ch);
1595 			if (ret)
1596 				return ret;
1597 		}
1598 
1599 		len = min_t(unsigned int, dma_len, dev->mr_page_size - offset);
1600 
1601 		if (!state->npages)
1602 			state->base_dma_addr = dma_addr;
1603 		state->pages[state->npages++] = dma_addr & dev->mr_page_mask;
1604 		state->dma_len += len;
1605 		dma_addr += len;
1606 		dma_len -= len;
1607 	}
1608 
1609 	/*
1610 	 * If the end of the MR is not on a page boundary then we need to
1611 	 * close it out and start a new one -- we can only merge at page
1612 	 * boundaries.
1613 	 */
1614 	ret = 0;
1615 	if ((dma_addr & ~dev->mr_page_mask) != 0)
1616 		ret = srp_map_finish_fmr(state, ch);
1617 	return ret;
1618 }
1619 
1620 static int srp_map_sg_fmr(struct srp_map_state *state, struct srp_rdma_ch *ch,
1621 			  struct srp_request *req, struct scatterlist *scat,
1622 			  int count)
1623 {
1624 	struct scatterlist *sg;
1625 	int i, ret;
1626 
1627 	state->pages = req->map_page;
1628 	state->fmr.next = req->fmr_list;
1629 	state->fmr.end = req->fmr_list + ch->target->mr_per_cmd;
1630 
1631 	for_each_sg(scat, sg, count, i) {
1632 		ret = srp_map_sg_entry(state, ch, sg);
1633 		if (ret)
1634 			return ret;
1635 	}
1636 
1637 	ret = srp_map_finish_fmr(state, ch);
1638 	if (ret)
1639 		return ret;
1640 
1641 	return 0;
1642 }
1643 
1644 static int srp_map_sg_fr(struct srp_map_state *state, struct srp_rdma_ch *ch,
1645 			 struct srp_request *req, struct scatterlist *scat,
1646 			 int count)
1647 {
1648 	unsigned int sg_offset = 0;
1649 
1650 	state->fr.next = req->fr_list;
1651 	state->fr.end = req->fr_list + ch->target->mr_per_cmd;
1652 	state->sg = scat;
1653 
1654 	if (count == 0)
1655 		return 0;
1656 
1657 	while (count) {
1658 		int i, n;
1659 
1660 		n = srp_map_finish_fr(state, req, ch, count, &sg_offset);
1661 		if (unlikely(n < 0))
1662 			return n;
1663 
1664 		count -= n;
1665 		for (i = 0; i < n; i++)
1666 			state->sg = sg_next(state->sg);
1667 	}
1668 
1669 	return 0;
1670 }
1671 
1672 static int srp_map_sg_dma(struct srp_map_state *state, struct srp_rdma_ch *ch,
1673 			  struct srp_request *req, struct scatterlist *scat,
1674 			  int count)
1675 {
1676 	struct srp_target_port *target = ch->target;
1677 	struct srp_device *dev = target->srp_host->srp_dev;
1678 	struct scatterlist *sg;
1679 	int i;
1680 
1681 	for_each_sg(scat, sg, count, i) {
1682 		srp_map_desc(state, ib_sg_dma_address(dev->dev, sg),
1683 			     ib_sg_dma_len(dev->dev, sg),
1684 			     target->global_rkey);
1685 	}
1686 
1687 	return 0;
1688 }
1689 
1690 /*
1691  * Register the indirect data buffer descriptor with the HCA.
1692  *
1693  * Note: since the indirect data buffer descriptor has been allocated with
1694  * kmalloc() it is guaranteed that this buffer is a physically contiguous
1695  * memory buffer.
1696  */
1697 static int srp_map_idb(struct srp_rdma_ch *ch, struct srp_request *req,
1698 		       void **next_mr, void **end_mr, u32 idb_len,
1699 		       __be32 *idb_rkey)
1700 {
1701 	struct srp_target_port *target = ch->target;
1702 	struct srp_device *dev = target->srp_host->srp_dev;
1703 	struct srp_map_state state;
1704 	struct srp_direct_buf idb_desc;
1705 	u64 idb_pages[1];
1706 	struct scatterlist idb_sg[1];
1707 	int ret;
1708 
1709 	memset(&state, 0, sizeof(state));
1710 	memset(&idb_desc, 0, sizeof(idb_desc));
1711 	state.gen.next = next_mr;
1712 	state.gen.end = end_mr;
1713 	state.desc = &idb_desc;
1714 	state.base_dma_addr = req->indirect_dma_addr;
1715 	state.dma_len = idb_len;
1716 
1717 	if (dev->use_fast_reg) {
1718 		state.sg = idb_sg;
1719 		sg_init_one(idb_sg, req->indirect_desc, idb_len);
1720 		idb_sg->dma_address = req->indirect_dma_addr; /* hack! */
1721 #ifdef CONFIG_NEED_SG_DMA_LENGTH
1722 		idb_sg->dma_length = idb_sg->length;	      /* hack^2 */
1723 #endif
1724 		ret = srp_map_finish_fr(&state, req, ch, 1, NULL);
1725 		if (ret < 0)
1726 			return ret;
1727 		WARN_ON_ONCE(ret < 1);
1728 	} else if (dev->use_fmr) {
1729 		state.pages = idb_pages;
1730 		state.pages[0] = (req->indirect_dma_addr &
1731 				  dev->mr_page_mask);
1732 		state.npages = 1;
1733 		ret = srp_map_finish_fmr(&state, ch);
1734 		if (ret < 0)
1735 			return ret;
1736 	} else {
1737 		return -EINVAL;
1738 	}
1739 
1740 	*idb_rkey = idb_desc.key;
1741 
1742 	return 0;
1743 }
1744 
1745 static void srp_check_mapping(struct srp_map_state *state,
1746 			      struct srp_rdma_ch *ch, struct srp_request *req,
1747 			      struct scatterlist *scat, int count)
1748 {
1749 	struct srp_device *dev = ch->target->srp_host->srp_dev;
1750 	struct srp_fr_desc **pfr;
1751 	u64 desc_len = 0, mr_len = 0;
1752 	int i;
1753 
1754 	for (i = 0; i < state->ndesc; i++)
1755 		desc_len += be32_to_cpu(req->indirect_desc[i].len);
1756 	if (dev->use_fast_reg)
1757 		for (i = 0, pfr = req->fr_list; i < state->nmdesc; i++, pfr++)
1758 			mr_len += (*pfr)->mr->length;
1759 	else if (dev->use_fmr)
1760 		for (i = 0; i < state->nmdesc; i++)
1761 			mr_len += be32_to_cpu(req->indirect_desc[i].len);
1762 	if (desc_len != scsi_bufflen(req->scmnd) ||
1763 	    mr_len > scsi_bufflen(req->scmnd))
1764 		pr_err("Inconsistent: scsi len %d <> desc len %lld <> mr len %lld; ndesc %d; nmdesc = %d\n",
1765 		       scsi_bufflen(req->scmnd), desc_len, mr_len,
1766 		       state->ndesc, state->nmdesc);
1767 }
1768 
1769 /**
1770  * srp_map_data() - map SCSI data buffer onto an SRP request
1771  * @scmnd: SCSI command to map
1772  * @ch: SRP RDMA channel
1773  * @req: SRP request
1774  *
1775  * Returns the length in bytes of the SRP_CMD IU or a negative value if
1776  * mapping failed.
1777  */
1778 static int srp_map_data(struct scsi_cmnd *scmnd, struct srp_rdma_ch *ch,
1779 			struct srp_request *req)
1780 {
1781 	struct srp_target_port *target = ch->target;
1782 	struct scatterlist *scat;
1783 	struct srp_cmd *cmd = req->cmd->buf;
1784 	int len, nents, count, ret;
1785 	struct srp_device *dev;
1786 	struct ib_device *ibdev;
1787 	struct srp_map_state state;
1788 	struct srp_indirect_buf *indirect_hdr;
1789 	u32 idb_len, table_len;
1790 	__be32 idb_rkey;
1791 	u8 fmt;
1792 
1793 	if (!scsi_sglist(scmnd) || scmnd->sc_data_direction == DMA_NONE)
1794 		return sizeof (struct srp_cmd);
1795 
1796 	if (scmnd->sc_data_direction != DMA_FROM_DEVICE &&
1797 	    scmnd->sc_data_direction != DMA_TO_DEVICE) {
1798 		shost_printk(KERN_WARNING, target->scsi_host,
1799 			     PFX "Unhandled data direction %d\n",
1800 			     scmnd->sc_data_direction);
1801 		return -EINVAL;
1802 	}
1803 
1804 	nents = scsi_sg_count(scmnd);
1805 	scat  = scsi_sglist(scmnd);
1806 
1807 	dev = target->srp_host->srp_dev;
1808 	ibdev = dev->dev;
1809 
1810 	count = ib_dma_map_sg(ibdev, scat, nents, scmnd->sc_data_direction);
1811 	if (unlikely(count == 0))
1812 		return -EIO;
1813 
1814 	fmt = SRP_DATA_DESC_DIRECT;
1815 	len = sizeof (struct srp_cmd) +	sizeof (struct srp_direct_buf);
1816 
1817 	if (count == 1 && target->global_rkey) {
1818 		/*
1819 		 * The midlayer only generated a single gather/scatter
1820 		 * entry, or DMA mapping coalesced everything to a
1821 		 * single entry.  So a direct descriptor along with
1822 		 * the DMA MR suffices.
1823 		 */
1824 		struct srp_direct_buf *buf = (void *) cmd->add_data;
1825 
1826 		buf->va  = cpu_to_be64(ib_sg_dma_address(ibdev, scat));
1827 		buf->key = cpu_to_be32(target->global_rkey);
1828 		buf->len = cpu_to_be32(ib_sg_dma_len(ibdev, scat));
1829 
1830 		req->nmdesc = 0;
1831 		goto map_complete;
1832 	}
1833 
1834 	/*
1835 	 * We have more than one scatter/gather entry, so build our indirect
1836 	 * descriptor table, trying to merge as many entries as we can.
1837 	 */
1838 	indirect_hdr = (void *) cmd->add_data;
1839 
1840 	ib_dma_sync_single_for_cpu(ibdev, req->indirect_dma_addr,
1841 				   target->indirect_size, DMA_TO_DEVICE);
1842 
1843 	memset(&state, 0, sizeof(state));
1844 	state.desc = req->indirect_desc;
1845 	if (dev->use_fast_reg)
1846 		ret = srp_map_sg_fr(&state, ch, req, scat, count);
1847 	else if (dev->use_fmr)
1848 		ret = srp_map_sg_fmr(&state, ch, req, scat, count);
1849 	else
1850 		ret = srp_map_sg_dma(&state, ch, req, scat, count);
1851 	req->nmdesc = state.nmdesc;
1852 	if (ret < 0)
1853 		goto unmap;
1854 
1855 	{
1856 		DEFINE_DYNAMIC_DEBUG_METADATA(ddm,
1857 			"Memory mapping consistency check");
1858 		if (DYNAMIC_DEBUG_BRANCH(ddm))
1859 			srp_check_mapping(&state, ch, req, scat, count);
1860 	}
1861 
1862 	/* We've mapped the request, now pull as much of the indirect
1863 	 * descriptor table as we can into the command buffer. If this
1864 	 * target is not using an external indirect table, we are
1865 	 * guaranteed to fit into the command, as the SCSI layer won't
1866 	 * give us more S/G entries than we allow.
1867 	 */
1868 	if (state.ndesc == 1) {
1869 		/*
1870 		 * Memory registration collapsed the sg-list into one entry,
1871 		 * so use a direct descriptor.
1872 		 */
1873 		struct srp_direct_buf *buf = (void *) cmd->add_data;
1874 
1875 		*buf = req->indirect_desc[0];
1876 		goto map_complete;
1877 	}
1878 
1879 	if (unlikely(target->cmd_sg_cnt < state.ndesc &&
1880 						!target->allow_ext_sg)) {
1881 		shost_printk(KERN_ERR, target->scsi_host,
1882 			     "Could not fit S/G list into SRP_CMD\n");
1883 		ret = -EIO;
1884 		goto unmap;
1885 	}
1886 
1887 	count = min(state.ndesc, target->cmd_sg_cnt);
1888 	table_len = state.ndesc * sizeof (struct srp_direct_buf);
1889 	idb_len = sizeof(struct srp_indirect_buf) + table_len;
1890 
1891 	fmt = SRP_DATA_DESC_INDIRECT;
1892 	len = sizeof(struct srp_cmd) + sizeof (struct srp_indirect_buf);
1893 	len += count * sizeof (struct srp_direct_buf);
1894 
1895 	memcpy(indirect_hdr->desc_list, req->indirect_desc,
1896 	       count * sizeof (struct srp_direct_buf));
1897 
1898 	if (!target->global_rkey) {
1899 		ret = srp_map_idb(ch, req, state.gen.next, state.gen.end,
1900 				  idb_len, &idb_rkey);
1901 		if (ret < 0)
1902 			goto unmap;
1903 		req->nmdesc++;
1904 	} else {
1905 		idb_rkey = cpu_to_be32(target->global_rkey);
1906 	}
1907 
1908 	indirect_hdr->table_desc.va = cpu_to_be64(req->indirect_dma_addr);
1909 	indirect_hdr->table_desc.key = idb_rkey;
1910 	indirect_hdr->table_desc.len = cpu_to_be32(table_len);
1911 	indirect_hdr->len = cpu_to_be32(state.total_len);
1912 
1913 	if (scmnd->sc_data_direction == DMA_TO_DEVICE)
1914 		cmd->data_out_desc_cnt = count;
1915 	else
1916 		cmd->data_in_desc_cnt = count;
1917 
1918 	ib_dma_sync_single_for_device(ibdev, req->indirect_dma_addr, table_len,
1919 				      DMA_TO_DEVICE);
1920 
1921 map_complete:
1922 	if (scmnd->sc_data_direction == DMA_TO_DEVICE)
1923 		cmd->buf_fmt = fmt << 4;
1924 	else
1925 		cmd->buf_fmt = fmt;
1926 
1927 	return len;
1928 
1929 unmap:
1930 	srp_unmap_data(scmnd, ch, req);
1931 	if (ret == -ENOMEM && req->nmdesc >= target->mr_pool_size)
1932 		ret = -E2BIG;
1933 	return ret;
1934 }
1935 
1936 /*
1937  * Return an IU and possible credit to the free pool
1938  */
1939 static void srp_put_tx_iu(struct srp_rdma_ch *ch, struct srp_iu *iu,
1940 			  enum srp_iu_type iu_type)
1941 {
1942 	unsigned long flags;
1943 
1944 	spin_lock_irqsave(&ch->lock, flags);
1945 	list_add(&iu->list, &ch->free_tx);
1946 	if (iu_type != SRP_IU_RSP)
1947 		++ch->req_lim;
1948 	spin_unlock_irqrestore(&ch->lock, flags);
1949 }
1950 
1951 /*
1952  * Must be called with ch->lock held to protect req_lim and free_tx.
1953  * If IU is not sent, it must be returned using srp_put_tx_iu().
1954  *
1955  * Note:
1956  * An upper limit for the number of allocated information units for each
1957  * request type is:
1958  * - SRP_IU_CMD: SRP_CMD_SQ_SIZE, since the SCSI mid-layer never queues
1959  *   more than Scsi_Host.can_queue requests.
1960  * - SRP_IU_TSK_MGMT: SRP_TSK_MGMT_SQ_SIZE.
1961  * - SRP_IU_RSP: 1, since a conforming SRP target never sends more than
1962  *   one unanswered SRP request to an initiator.
1963  */
1964 static struct srp_iu *__srp_get_tx_iu(struct srp_rdma_ch *ch,
1965 				      enum srp_iu_type iu_type)
1966 {
1967 	struct srp_target_port *target = ch->target;
1968 	s32 rsv = (iu_type == SRP_IU_TSK_MGMT) ? 0 : SRP_TSK_MGMT_SQ_SIZE;
1969 	struct srp_iu *iu;
1970 
1971 	lockdep_assert_held(&ch->lock);
1972 
1973 	ib_process_cq_direct(ch->send_cq, -1);
1974 
1975 	if (list_empty(&ch->free_tx))
1976 		return NULL;
1977 
1978 	/* Initiator responses to target requests do not consume credits */
1979 	if (iu_type != SRP_IU_RSP) {
1980 		if (ch->req_lim <= rsv) {
1981 			++target->zero_req_lim;
1982 			return NULL;
1983 		}
1984 
1985 		--ch->req_lim;
1986 	}
1987 
1988 	iu = list_first_entry(&ch->free_tx, struct srp_iu, list);
1989 	list_del(&iu->list);
1990 	return iu;
1991 }
1992 
1993 /*
1994  * Note: if this function is called from inside ib_drain_sq() then it will
1995  * be called without ch->lock being held. If ib_drain_sq() dequeues a WQE
1996  * with status IB_WC_SUCCESS then that's a bug.
1997  */
1998 static void srp_send_done(struct ib_cq *cq, struct ib_wc *wc)
1999 {
2000 	struct srp_iu *iu = container_of(wc->wr_cqe, struct srp_iu, cqe);
2001 	struct srp_rdma_ch *ch = cq->cq_context;
2002 
2003 	if (unlikely(wc->status != IB_WC_SUCCESS)) {
2004 		srp_handle_qp_err(cq, wc, "SEND");
2005 		return;
2006 	}
2007 
2008 	lockdep_assert_held(&ch->lock);
2009 
2010 	list_add(&iu->list, &ch->free_tx);
2011 }
2012 
2013 static int srp_post_send(struct srp_rdma_ch *ch, struct srp_iu *iu, int len)
2014 {
2015 	struct srp_target_port *target = ch->target;
2016 	struct ib_sge list;
2017 	struct ib_send_wr wr;
2018 
2019 	list.addr   = iu->dma;
2020 	list.length = len;
2021 	list.lkey   = target->lkey;
2022 
2023 	iu->cqe.done = srp_send_done;
2024 
2025 	wr.next       = NULL;
2026 	wr.wr_cqe     = &iu->cqe;
2027 	wr.sg_list    = &list;
2028 	wr.num_sge    = 1;
2029 	wr.opcode     = IB_WR_SEND;
2030 	wr.send_flags = IB_SEND_SIGNALED;
2031 
2032 	return ib_post_send(ch->qp, &wr, NULL);
2033 }
2034 
2035 static int srp_post_recv(struct srp_rdma_ch *ch, struct srp_iu *iu)
2036 {
2037 	struct srp_target_port *target = ch->target;
2038 	struct ib_recv_wr wr;
2039 	struct ib_sge list;
2040 
2041 	list.addr   = iu->dma;
2042 	list.length = iu->size;
2043 	list.lkey   = target->lkey;
2044 
2045 	iu->cqe.done = srp_recv_done;
2046 
2047 	wr.next     = NULL;
2048 	wr.wr_cqe   = &iu->cqe;
2049 	wr.sg_list  = &list;
2050 	wr.num_sge  = 1;
2051 
2052 	return ib_post_recv(ch->qp, &wr, NULL);
2053 }
2054 
2055 static void srp_process_rsp(struct srp_rdma_ch *ch, struct srp_rsp *rsp)
2056 {
2057 	struct srp_target_port *target = ch->target;
2058 	struct srp_request *req;
2059 	struct scsi_cmnd *scmnd;
2060 	unsigned long flags;
2061 
2062 	if (unlikely(rsp->tag & SRP_TAG_TSK_MGMT)) {
2063 		spin_lock_irqsave(&ch->lock, flags);
2064 		ch->req_lim += be32_to_cpu(rsp->req_lim_delta);
2065 		if (rsp->tag == ch->tsk_mgmt_tag) {
2066 			ch->tsk_mgmt_status = -1;
2067 			if (be32_to_cpu(rsp->resp_data_len) >= 4)
2068 				ch->tsk_mgmt_status = rsp->data[3];
2069 			complete(&ch->tsk_mgmt_done);
2070 		} else {
2071 			shost_printk(KERN_ERR, target->scsi_host,
2072 				     "Received tsk mgmt response too late for tag %#llx\n",
2073 				     rsp->tag);
2074 		}
2075 		spin_unlock_irqrestore(&ch->lock, flags);
2076 	} else {
2077 		scmnd = scsi_host_find_tag(target->scsi_host, rsp->tag);
2078 		if (scmnd && scmnd->host_scribble) {
2079 			req = (void *)scmnd->host_scribble;
2080 			scmnd = srp_claim_req(ch, req, NULL, scmnd);
2081 		} else {
2082 			scmnd = NULL;
2083 		}
2084 		if (!scmnd) {
2085 			shost_printk(KERN_ERR, target->scsi_host,
2086 				     "Null scmnd for RSP w/tag %#016llx received on ch %td / QP %#x\n",
2087 				     rsp->tag, ch - target->ch, ch->qp->qp_num);
2088 
2089 			spin_lock_irqsave(&ch->lock, flags);
2090 			ch->req_lim += be32_to_cpu(rsp->req_lim_delta);
2091 			spin_unlock_irqrestore(&ch->lock, flags);
2092 
2093 			return;
2094 		}
2095 		scmnd->result = rsp->status;
2096 
2097 		if (rsp->flags & SRP_RSP_FLAG_SNSVALID) {
2098 			memcpy(scmnd->sense_buffer, rsp->data +
2099 			       be32_to_cpu(rsp->resp_data_len),
2100 			       min_t(int, be32_to_cpu(rsp->sense_data_len),
2101 				     SCSI_SENSE_BUFFERSIZE));
2102 		}
2103 
2104 		if (unlikely(rsp->flags & SRP_RSP_FLAG_DIUNDER))
2105 			scsi_set_resid(scmnd, be32_to_cpu(rsp->data_in_res_cnt));
2106 		else if (unlikely(rsp->flags & SRP_RSP_FLAG_DIOVER))
2107 			scsi_set_resid(scmnd, -be32_to_cpu(rsp->data_in_res_cnt));
2108 		else if (unlikely(rsp->flags & SRP_RSP_FLAG_DOUNDER))
2109 			scsi_set_resid(scmnd, be32_to_cpu(rsp->data_out_res_cnt));
2110 		else if (unlikely(rsp->flags & SRP_RSP_FLAG_DOOVER))
2111 			scsi_set_resid(scmnd, -be32_to_cpu(rsp->data_out_res_cnt));
2112 
2113 		srp_free_req(ch, req, scmnd,
2114 			     be32_to_cpu(rsp->req_lim_delta));
2115 
2116 		scmnd->host_scribble = NULL;
2117 		scmnd->scsi_done(scmnd);
2118 	}
2119 }
2120 
2121 static int srp_response_common(struct srp_rdma_ch *ch, s32 req_delta,
2122 			       void *rsp, int len)
2123 {
2124 	struct srp_target_port *target = ch->target;
2125 	struct ib_device *dev = target->srp_host->srp_dev->dev;
2126 	unsigned long flags;
2127 	struct srp_iu *iu;
2128 	int err;
2129 
2130 	spin_lock_irqsave(&ch->lock, flags);
2131 	ch->req_lim += req_delta;
2132 	iu = __srp_get_tx_iu(ch, SRP_IU_RSP);
2133 	spin_unlock_irqrestore(&ch->lock, flags);
2134 
2135 	if (!iu) {
2136 		shost_printk(KERN_ERR, target->scsi_host, PFX
2137 			     "no IU available to send response\n");
2138 		return 1;
2139 	}
2140 
2141 	ib_dma_sync_single_for_cpu(dev, iu->dma, len, DMA_TO_DEVICE);
2142 	memcpy(iu->buf, rsp, len);
2143 	ib_dma_sync_single_for_device(dev, iu->dma, len, DMA_TO_DEVICE);
2144 
2145 	err = srp_post_send(ch, iu, len);
2146 	if (err) {
2147 		shost_printk(KERN_ERR, target->scsi_host, PFX
2148 			     "unable to post response: %d\n", err);
2149 		srp_put_tx_iu(ch, iu, SRP_IU_RSP);
2150 	}
2151 
2152 	return err;
2153 }
2154 
2155 static void srp_process_cred_req(struct srp_rdma_ch *ch,
2156 				 struct srp_cred_req *req)
2157 {
2158 	struct srp_cred_rsp rsp = {
2159 		.opcode = SRP_CRED_RSP,
2160 		.tag = req->tag,
2161 	};
2162 	s32 delta = be32_to_cpu(req->req_lim_delta);
2163 
2164 	if (srp_response_common(ch, delta, &rsp, sizeof(rsp)))
2165 		shost_printk(KERN_ERR, ch->target->scsi_host, PFX
2166 			     "problems processing SRP_CRED_REQ\n");
2167 }
2168 
2169 static void srp_process_aer_req(struct srp_rdma_ch *ch,
2170 				struct srp_aer_req *req)
2171 {
2172 	struct srp_target_port *target = ch->target;
2173 	struct srp_aer_rsp rsp = {
2174 		.opcode = SRP_AER_RSP,
2175 		.tag = req->tag,
2176 	};
2177 	s32 delta = be32_to_cpu(req->req_lim_delta);
2178 
2179 	shost_printk(KERN_ERR, target->scsi_host, PFX
2180 		     "ignoring AER for LUN %llu\n", scsilun_to_int(&req->lun));
2181 
2182 	if (srp_response_common(ch, delta, &rsp, sizeof(rsp)))
2183 		shost_printk(KERN_ERR, target->scsi_host, PFX
2184 			     "problems processing SRP_AER_REQ\n");
2185 }
2186 
2187 static void srp_recv_done(struct ib_cq *cq, struct ib_wc *wc)
2188 {
2189 	struct srp_iu *iu = container_of(wc->wr_cqe, struct srp_iu, cqe);
2190 	struct srp_rdma_ch *ch = cq->cq_context;
2191 	struct srp_target_port *target = ch->target;
2192 	struct ib_device *dev = target->srp_host->srp_dev->dev;
2193 	int res;
2194 	u8 opcode;
2195 
2196 	if (unlikely(wc->status != IB_WC_SUCCESS)) {
2197 		srp_handle_qp_err(cq, wc, "RECV");
2198 		return;
2199 	}
2200 
2201 	ib_dma_sync_single_for_cpu(dev, iu->dma, ch->max_ti_iu_len,
2202 				   DMA_FROM_DEVICE);
2203 
2204 	opcode = *(u8 *) iu->buf;
2205 
2206 	if (0) {
2207 		shost_printk(KERN_ERR, target->scsi_host,
2208 			     PFX "recv completion, opcode 0x%02x\n", opcode);
2209 		print_hex_dump(KERN_ERR, "", DUMP_PREFIX_OFFSET, 8, 1,
2210 			       iu->buf, wc->byte_len, true);
2211 	}
2212 
2213 	switch (opcode) {
2214 	case SRP_RSP:
2215 		srp_process_rsp(ch, iu->buf);
2216 		break;
2217 
2218 	case SRP_CRED_REQ:
2219 		srp_process_cred_req(ch, iu->buf);
2220 		break;
2221 
2222 	case SRP_AER_REQ:
2223 		srp_process_aer_req(ch, iu->buf);
2224 		break;
2225 
2226 	case SRP_T_LOGOUT:
2227 		/* XXX Handle target logout */
2228 		shost_printk(KERN_WARNING, target->scsi_host,
2229 			     PFX "Got target logout request\n");
2230 		break;
2231 
2232 	default:
2233 		shost_printk(KERN_WARNING, target->scsi_host,
2234 			     PFX "Unhandled SRP opcode 0x%02x\n", opcode);
2235 		break;
2236 	}
2237 
2238 	ib_dma_sync_single_for_device(dev, iu->dma, ch->max_ti_iu_len,
2239 				      DMA_FROM_DEVICE);
2240 
2241 	res = srp_post_recv(ch, iu);
2242 	if (res != 0)
2243 		shost_printk(KERN_ERR, target->scsi_host,
2244 			     PFX "Recv failed with error code %d\n", res);
2245 }
2246 
2247 /**
2248  * srp_tl_err_work() - handle a transport layer error
2249  * @work: Work structure embedded in an SRP target port.
2250  *
2251  * Note: This function may get invoked before the rport has been created,
2252  * hence the target->rport test.
2253  */
2254 static void srp_tl_err_work(struct work_struct *work)
2255 {
2256 	struct srp_target_port *target;
2257 
2258 	target = container_of(work, struct srp_target_port, tl_err_work);
2259 	if (target->rport)
2260 		srp_start_tl_fail_timers(target->rport);
2261 }
2262 
2263 static void srp_handle_qp_err(struct ib_cq *cq, struct ib_wc *wc,
2264 		const char *opname)
2265 {
2266 	struct srp_rdma_ch *ch = cq->cq_context;
2267 	struct srp_target_port *target = ch->target;
2268 
2269 	if (ch->connected && !target->qp_in_error) {
2270 		shost_printk(KERN_ERR, target->scsi_host,
2271 			     PFX "failed %s status %s (%d) for CQE %p\n",
2272 			     opname, ib_wc_status_msg(wc->status), wc->status,
2273 			     wc->wr_cqe);
2274 		queue_work(system_long_wq, &target->tl_err_work);
2275 	}
2276 	target->qp_in_error = true;
2277 }
2278 
2279 static int srp_queuecommand(struct Scsi_Host *shost, struct scsi_cmnd *scmnd)
2280 {
2281 	struct srp_target_port *target = host_to_target(shost);
2282 	struct srp_rport *rport = target->rport;
2283 	struct srp_rdma_ch *ch;
2284 	struct srp_request *req;
2285 	struct srp_iu *iu;
2286 	struct srp_cmd *cmd;
2287 	struct ib_device *dev;
2288 	unsigned long flags;
2289 	u32 tag;
2290 	u16 idx;
2291 	int len, ret;
2292 	const bool in_scsi_eh = !in_interrupt() && current == shost->ehandler;
2293 
2294 	/*
2295 	 * The SCSI EH thread is the only context from which srp_queuecommand()
2296 	 * can get invoked for blocked devices (SDEV_BLOCK /
2297 	 * SDEV_CREATED_BLOCK). Avoid racing with srp_reconnect_rport() by
2298 	 * locking the rport mutex if invoked from inside the SCSI EH.
2299 	 */
2300 	if (in_scsi_eh)
2301 		mutex_lock(&rport->mutex);
2302 
2303 	scmnd->result = srp_chkready(target->rport);
2304 	if (unlikely(scmnd->result))
2305 		goto err;
2306 
2307 	WARN_ON_ONCE(scmnd->request->tag < 0);
2308 	tag = blk_mq_unique_tag(scmnd->request);
2309 	ch = &target->ch[blk_mq_unique_tag_to_hwq(tag)];
2310 	idx = blk_mq_unique_tag_to_tag(tag);
2311 	WARN_ONCE(idx >= target->req_ring_size, "%s: tag %#x: idx %d >= %d\n",
2312 		  dev_name(&shost->shost_gendev), tag, idx,
2313 		  target->req_ring_size);
2314 
2315 	spin_lock_irqsave(&ch->lock, flags);
2316 	iu = __srp_get_tx_iu(ch, SRP_IU_CMD);
2317 	spin_unlock_irqrestore(&ch->lock, flags);
2318 
2319 	if (!iu)
2320 		goto err;
2321 
2322 	req = &ch->req_ring[idx];
2323 	dev = target->srp_host->srp_dev->dev;
2324 	ib_dma_sync_single_for_cpu(dev, iu->dma, target->max_iu_len,
2325 				   DMA_TO_DEVICE);
2326 
2327 	scmnd->host_scribble = (void *) req;
2328 
2329 	cmd = iu->buf;
2330 	memset(cmd, 0, sizeof *cmd);
2331 
2332 	cmd->opcode = SRP_CMD;
2333 	int_to_scsilun(scmnd->device->lun, &cmd->lun);
2334 	cmd->tag    = tag;
2335 	memcpy(cmd->cdb, scmnd->cmnd, scmnd->cmd_len);
2336 
2337 	req->scmnd    = scmnd;
2338 	req->cmd      = iu;
2339 
2340 	len = srp_map_data(scmnd, ch, req);
2341 	if (len < 0) {
2342 		shost_printk(KERN_ERR, target->scsi_host,
2343 			     PFX "Failed to map data (%d)\n", len);
2344 		/*
2345 		 * If we ran out of memory descriptors (-ENOMEM) because an
2346 		 * application is queuing many requests with more than
2347 		 * max_pages_per_mr sg-list elements, tell the SCSI mid-layer
2348 		 * to reduce queue depth temporarily.
2349 		 */
2350 		scmnd->result = len == -ENOMEM ?
2351 			DID_OK << 16 | QUEUE_FULL << 1 : DID_ERROR << 16;
2352 		goto err_iu;
2353 	}
2354 
2355 	ib_dma_sync_single_for_device(dev, iu->dma, target->max_iu_len,
2356 				      DMA_TO_DEVICE);
2357 
2358 	if (srp_post_send(ch, iu, len)) {
2359 		shost_printk(KERN_ERR, target->scsi_host, PFX "Send failed\n");
2360 		goto err_unmap;
2361 	}
2362 
2363 	ret = 0;
2364 
2365 unlock_rport:
2366 	if (in_scsi_eh)
2367 		mutex_unlock(&rport->mutex);
2368 
2369 	return ret;
2370 
2371 err_unmap:
2372 	srp_unmap_data(scmnd, ch, req);
2373 
2374 err_iu:
2375 	srp_put_tx_iu(ch, iu, SRP_IU_CMD);
2376 
2377 	/*
2378 	 * Avoid that the loops that iterate over the request ring can
2379 	 * encounter a dangling SCSI command pointer.
2380 	 */
2381 	req->scmnd = NULL;
2382 
2383 err:
2384 	if (scmnd->result) {
2385 		scmnd->scsi_done(scmnd);
2386 		ret = 0;
2387 	} else {
2388 		ret = SCSI_MLQUEUE_HOST_BUSY;
2389 	}
2390 
2391 	goto unlock_rport;
2392 }
2393 
2394 /*
2395  * Note: the resources allocated in this function are freed in
2396  * srp_free_ch_ib().
2397  */
2398 static int srp_alloc_iu_bufs(struct srp_rdma_ch *ch)
2399 {
2400 	struct srp_target_port *target = ch->target;
2401 	int i;
2402 
2403 	ch->rx_ring = kcalloc(target->queue_size, sizeof(*ch->rx_ring),
2404 			      GFP_KERNEL);
2405 	if (!ch->rx_ring)
2406 		goto err_no_ring;
2407 	ch->tx_ring = kcalloc(target->queue_size, sizeof(*ch->tx_ring),
2408 			      GFP_KERNEL);
2409 	if (!ch->tx_ring)
2410 		goto err_no_ring;
2411 
2412 	for (i = 0; i < target->queue_size; ++i) {
2413 		ch->rx_ring[i] = srp_alloc_iu(target->srp_host,
2414 					      ch->max_ti_iu_len,
2415 					      GFP_KERNEL, DMA_FROM_DEVICE);
2416 		if (!ch->rx_ring[i])
2417 			goto err;
2418 	}
2419 
2420 	for (i = 0; i < target->queue_size; ++i) {
2421 		ch->tx_ring[i] = srp_alloc_iu(target->srp_host,
2422 					      target->max_iu_len,
2423 					      GFP_KERNEL, DMA_TO_DEVICE);
2424 		if (!ch->tx_ring[i])
2425 			goto err;
2426 
2427 		list_add(&ch->tx_ring[i]->list, &ch->free_tx);
2428 	}
2429 
2430 	return 0;
2431 
2432 err:
2433 	for (i = 0; i < target->queue_size; ++i) {
2434 		srp_free_iu(target->srp_host, ch->rx_ring[i]);
2435 		srp_free_iu(target->srp_host, ch->tx_ring[i]);
2436 	}
2437 
2438 
2439 err_no_ring:
2440 	kfree(ch->tx_ring);
2441 	ch->tx_ring = NULL;
2442 	kfree(ch->rx_ring);
2443 	ch->rx_ring = NULL;
2444 
2445 	return -ENOMEM;
2446 }
2447 
2448 static uint32_t srp_compute_rq_tmo(struct ib_qp_attr *qp_attr, int attr_mask)
2449 {
2450 	uint64_t T_tr_ns, max_compl_time_ms;
2451 	uint32_t rq_tmo_jiffies;
2452 
2453 	/*
2454 	 * According to section 11.2.4.2 in the IBTA spec (Modify Queue Pair,
2455 	 * table 91), both the QP timeout and the retry count have to be set
2456 	 * for RC QP's during the RTR to RTS transition.
2457 	 */
2458 	WARN_ON_ONCE((attr_mask & (IB_QP_TIMEOUT | IB_QP_RETRY_CNT)) !=
2459 		     (IB_QP_TIMEOUT | IB_QP_RETRY_CNT));
2460 
2461 	/*
2462 	 * Set target->rq_tmo_jiffies to one second more than the largest time
2463 	 * it can take before an error completion is generated. See also
2464 	 * C9-140..142 in the IBTA spec for more information about how to
2465 	 * convert the QP Local ACK Timeout value to nanoseconds.
2466 	 */
2467 	T_tr_ns = 4096 * (1ULL << qp_attr->timeout);
2468 	max_compl_time_ms = qp_attr->retry_cnt * 4 * T_tr_ns;
2469 	do_div(max_compl_time_ms, NSEC_PER_MSEC);
2470 	rq_tmo_jiffies = msecs_to_jiffies(max_compl_time_ms + 1000);
2471 
2472 	return rq_tmo_jiffies;
2473 }
2474 
2475 static void srp_cm_rep_handler(struct ib_cm_id *cm_id,
2476 			       const struct srp_login_rsp *lrsp,
2477 			       struct srp_rdma_ch *ch)
2478 {
2479 	struct srp_target_port *target = ch->target;
2480 	struct ib_qp_attr *qp_attr = NULL;
2481 	int attr_mask = 0;
2482 	int ret = 0;
2483 	int i;
2484 
2485 	if (lrsp->opcode == SRP_LOGIN_RSP) {
2486 		ch->max_ti_iu_len = be32_to_cpu(lrsp->max_ti_iu_len);
2487 		ch->req_lim       = be32_to_cpu(lrsp->req_lim_delta);
2488 
2489 		/*
2490 		 * Reserve credits for task management so we don't
2491 		 * bounce requests back to the SCSI mid-layer.
2492 		 */
2493 		target->scsi_host->can_queue
2494 			= min(ch->req_lim - SRP_TSK_MGMT_SQ_SIZE,
2495 			      target->scsi_host->can_queue);
2496 		target->scsi_host->cmd_per_lun
2497 			= min_t(int, target->scsi_host->can_queue,
2498 				target->scsi_host->cmd_per_lun);
2499 	} else {
2500 		shost_printk(KERN_WARNING, target->scsi_host,
2501 			     PFX "Unhandled RSP opcode %#x\n", lrsp->opcode);
2502 		ret = -ECONNRESET;
2503 		goto error;
2504 	}
2505 
2506 	if (!ch->rx_ring) {
2507 		ret = srp_alloc_iu_bufs(ch);
2508 		if (ret)
2509 			goto error;
2510 	}
2511 
2512 	for (i = 0; i < target->queue_size; i++) {
2513 		struct srp_iu *iu = ch->rx_ring[i];
2514 
2515 		ret = srp_post_recv(ch, iu);
2516 		if (ret)
2517 			goto error;
2518 	}
2519 
2520 	if (!target->using_rdma_cm) {
2521 		ret = -ENOMEM;
2522 		qp_attr = kmalloc(sizeof(*qp_attr), GFP_KERNEL);
2523 		if (!qp_attr)
2524 			goto error;
2525 
2526 		qp_attr->qp_state = IB_QPS_RTR;
2527 		ret = ib_cm_init_qp_attr(cm_id, qp_attr, &attr_mask);
2528 		if (ret)
2529 			goto error_free;
2530 
2531 		ret = ib_modify_qp(ch->qp, qp_attr, attr_mask);
2532 		if (ret)
2533 			goto error_free;
2534 
2535 		qp_attr->qp_state = IB_QPS_RTS;
2536 		ret = ib_cm_init_qp_attr(cm_id, qp_attr, &attr_mask);
2537 		if (ret)
2538 			goto error_free;
2539 
2540 		target->rq_tmo_jiffies = srp_compute_rq_tmo(qp_attr, attr_mask);
2541 
2542 		ret = ib_modify_qp(ch->qp, qp_attr, attr_mask);
2543 		if (ret)
2544 			goto error_free;
2545 
2546 		ret = ib_send_cm_rtu(cm_id, NULL, 0);
2547 	}
2548 
2549 error_free:
2550 	kfree(qp_attr);
2551 
2552 error:
2553 	ch->status = ret;
2554 }
2555 
2556 static void srp_ib_cm_rej_handler(struct ib_cm_id *cm_id,
2557 				  const struct ib_cm_event *event,
2558 				  struct srp_rdma_ch *ch)
2559 {
2560 	struct srp_target_port *target = ch->target;
2561 	struct Scsi_Host *shost = target->scsi_host;
2562 	struct ib_class_port_info *cpi;
2563 	int opcode;
2564 	u16 dlid;
2565 
2566 	switch (event->param.rej_rcvd.reason) {
2567 	case IB_CM_REJ_PORT_CM_REDIRECT:
2568 		cpi = event->param.rej_rcvd.ari;
2569 		dlid = be16_to_cpu(cpi->redirect_lid);
2570 		sa_path_set_dlid(&ch->ib_cm.path, dlid);
2571 		ch->ib_cm.path.pkey = cpi->redirect_pkey;
2572 		cm_id->remote_cm_qpn = be32_to_cpu(cpi->redirect_qp) & 0x00ffffff;
2573 		memcpy(ch->ib_cm.path.dgid.raw, cpi->redirect_gid, 16);
2574 
2575 		ch->status = dlid ? SRP_DLID_REDIRECT : SRP_PORT_REDIRECT;
2576 		break;
2577 
2578 	case IB_CM_REJ_PORT_REDIRECT:
2579 		if (srp_target_is_topspin(target)) {
2580 			union ib_gid *dgid = &ch->ib_cm.path.dgid;
2581 
2582 			/*
2583 			 * Topspin/Cisco SRP gateways incorrectly send
2584 			 * reject reason code 25 when they mean 24
2585 			 * (port redirect).
2586 			 */
2587 			memcpy(dgid->raw, event->param.rej_rcvd.ari, 16);
2588 
2589 			shost_printk(KERN_DEBUG, shost,
2590 				     PFX "Topspin/Cisco redirect to target port GID %016llx%016llx\n",
2591 				     be64_to_cpu(dgid->global.subnet_prefix),
2592 				     be64_to_cpu(dgid->global.interface_id));
2593 
2594 			ch->status = SRP_PORT_REDIRECT;
2595 		} else {
2596 			shost_printk(KERN_WARNING, shost,
2597 				     "  REJ reason: IB_CM_REJ_PORT_REDIRECT\n");
2598 			ch->status = -ECONNRESET;
2599 		}
2600 		break;
2601 
2602 	case IB_CM_REJ_DUPLICATE_LOCAL_COMM_ID:
2603 		shost_printk(KERN_WARNING, shost,
2604 			    "  REJ reason: IB_CM_REJ_DUPLICATE_LOCAL_COMM_ID\n");
2605 		ch->status = -ECONNRESET;
2606 		break;
2607 
2608 	case IB_CM_REJ_CONSUMER_DEFINED:
2609 		opcode = *(u8 *) event->private_data;
2610 		if (opcode == SRP_LOGIN_REJ) {
2611 			struct srp_login_rej *rej = event->private_data;
2612 			u32 reason = be32_to_cpu(rej->reason);
2613 
2614 			if (reason == SRP_LOGIN_REJ_REQ_IT_IU_LENGTH_TOO_LARGE)
2615 				shost_printk(KERN_WARNING, shost,
2616 					     PFX "SRP_LOGIN_REJ: requested max_it_iu_len too large\n");
2617 			else
2618 				shost_printk(KERN_WARNING, shost, PFX
2619 					     "SRP LOGIN from %pI6 to %pI6 REJECTED, reason 0x%08x\n",
2620 					     target->sgid.raw,
2621 					     target->ib_cm.orig_dgid.raw,
2622 					     reason);
2623 		} else
2624 			shost_printk(KERN_WARNING, shost,
2625 				     "  REJ reason: IB_CM_REJ_CONSUMER_DEFINED,"
2626 				     " opcode 0x%02x\n", opcode);
2627 		ch->status = -ECONNRESET;
2628 		break;
2629 
2630 	case IB_CM_REJ_STALE_CONN:
2631 		shost_printk(KERN_WARNING, shost, "  REJ reason: stale connection\n");
2632 		ch->status = SRP_STALE_CONN;
2633 		break;
2634 
2635 	default:
2636 		shost_printk(KERN_WARNING, shost, "  REJ reason 0x%x\n",
2637 			     event->param.rej_rcvd.reason);
2638 		ch->status = -ECONNRESET;
2639 	}
2640 }
2641 
2642 static int srp_ib_cm_handler(struct ib_cm_id *cm_id,
2643 			     const struct ib_cm_event *event)
2644 {
2645 	struct srp_rdma_ch *ch = cm_id->context;
2646 	struct srp_target_port *target = ch->target;
2647 	int comp = 0;
2648 
2649 	switch (event->event) {
2650 	case IB_CM_REQ_ERROR:
2651 		shost_printk(KERN_DEBUG, target->scsi_host,
2652 			     PFX "Sending CM REQ failed\n");
2653 		comp = 1;
2654 		ch->status = -ECONNRESET;
2655 		break;
2656 
2657 	case IB_CM_REP_RECEIVED:
2658 		comp = 1;
2659 		srp_cm_rep_handler(cm_id, event->private_data, ch);
2660 		break;
2661 
2662 	case IB_CM_REJ_RECEIVED:
2663 		shost_printk(KERN_DEBUG, target->scsi_host, PFX "REJ received\n");
2664 		comp = 1;
2665 
2666 		srp_ib_cm_rej_handler(cm_id, event, ch);
2667 		break;
2668 
2669 	case IB_CM_DREQ_RECEIVED:
2670 		shost_printk(KERN_WARNING, target->scsi_host,
2671 			     PFX "DREQ received - connection closed\n");
2672 		ch->connected = false;
2673 		if (ib_send_cm_drep(cm_id, NULL, 0))
2674 			shost_printk(KERN_ERR, target->scsi_host,
2675 				     PFX "Sending CM DREP failed\n");
2676 		queue_work(system_long_wq, &target->tl_err_work);
2677 		break;
2678 
2679 	case IB_CM_TIMEWAIT_EXIT:
2680 		shost_printk(KERN_ERR, target->scsi_host,
2681 			     PFX "connection closed\n");
2682 		comp = 1;
2683 
2684 		ch->status = 0;
2685 		break;
2686 
2687 	case IB_CM_MRA_RECEIVED:
2688 	case IB_CM_DREQ_ERROR:
2689 	case IB_CM_DREP_RECEIVED:
2690 		break;
2691 
2692 	default:
2693 		shost_printk(KERN_WARNING, target->scsi_host,
2694 			     PFX "Unhandled CM event %d\n", event->event);
2695 		break;
2696 	}
2697 
2698 	if (comp)
2699 		complete(&ch->done);
2700 
2701 	return 0;
2702 }
2703 
2704 static void srp_rdma_cm_rej_handler(struct srp_rdma_ch *ch,
2705 				    struct rdma_cm_event *event)
2706 {
2707 	struct srp_target_port *target = ch->target;
2708 	struct Scsi_Host *shost = target->scsi_host;
2709 	int opcode;
2710 
2711 	switch (event->status) {
2712 	case IB_CM_REJ_DUPLICATE_LOCAL_COMM_ID:
2713 		shost_printk(KERN_WARNING, shost,
2714 			    "  REJ reason: IB_CM_REJ_DUPLICATE_LOCAL_COMM_ID\n");
2715 		ch->status = -ECONNRESET;
2716 		break;
2717 
2718 	case IB_CM_REJ_CONSUMER_DEFINED:
2719 		opcode = *(u8 *) event->param.conn.private_data;
2720 		if (opcode == SRP_LOGIN_REJ) {
2721 			struct srp_login_rej *rej =
2722 				(struct srp_login_rej *)
2723 				event->param.conn.private_data;
2724 			u32 reason = be32_to_cpu(rej->reason);
2725 
2726 			if (reason == SRP_LOGIN_REJ_REQ_IT_IU_LENGTH_TOO_LARGE)
2727 				shost_printk(KERN_WARNING, shost,
2728 					     PFX "SRP_LOGIN_REJ: requested max_it_iu_len too large\n");
2729 			else
2730 				shost_printk(KERN_WARNING, shost,
2731 					    PFX "SRP LOGIN REJECTED, reason 0x%08x\n", reason);
2732 		} else {
2733 			shost_printk(KERN_WARNING, shost,
2734 				     "  REJ reason: IB_CM_REJ_CONSUMER_DEFINED, opcode 0x%02x\n",
2735 				     opcode);
2736 		}
2737 		ch->status = -ECONNRESET;
2738 		break;
2739 
2740 	case IB_CM_REJ_STALE_CONN:
2741 		shost_printk(KERN_WARNING, shost,
2742 			     "  REJ reason: stale connection\n");
2743 		ch->status = SRP_STALE_CONN;
2744 		break;
2745 
2746 	default:
2747 		shost_printk(KERN_WARNING, shost, "  REJ reason 0x%x\n",
2748 			     event->status);
2749 		ch->status = -ECONNRESET;
2750 		break;
2751 	}
2752 }
2753 
2754 static int srp_rdma_cm_handler(struct rdma_cm_id *cm_id,
2755 			       struct rdma_cm_event *event)
2756 {
2757 	struct srp_rdma_ch *ch = cm_id->context;
2758 	struct srp_target_port *target = ch->target;
2759 	int comp = 0;
2760 
2761 	switch (event->event) {
2762 	case RDMA_CM_EVENT_ADDR_RESOLVED:
2763 		ch->status = 0;
2764 		comp = 1;
2765 		break;
2766 
2767 	case RDMA_CM_EVENT_ADDR_ERROR:
2768 		ch->status = -ENXIO;
2769 		comp = 1;
2770 		break;
2771 
2772 	case RDMA_CM_EVENT_ROUTE_RESOLVED:
2773 		ch->status = 0;
2774 		comp = 1;
2775 		break;
2776 
2777 	case RDMA_CM_EVENT_ROUTE_ERROR:
2778 	case RDMA_CM_EVENT_UNREACHABLE:
2779 		ch->status = -EHOSTUNREACH;
2780 		comp = 1;
2781 		break;
2782 
2783 	case RDMA_CM_EVENT_CONNECT_ERROR:
2784 		shost_printk(KERN_DEBUG, target->scsi_host,
2785 			     PFX "Sending CM REQ failed\n");
2786 		comp = 1;
2787 		ch->status = -ECONNRESET;
2788 		break;
2789 
2790 	case RDMA_CM_EVENT_ESTABLISHED:
2791 		comp = 1;
2792 		srp_cm_rep_handler(NULL, event->param.conn.private_data, ch);
2793 		break;
2794 
2795 	case RDMA_CM_EVENT_REJECTED:
2796 		shost_printk(KERN_DEBUG, target->scsi_host, PFX "REJ received\n");
2797 		comp = 1;
2798 
2799 		srp_rdma_cm_rej_handler(ch, event);
2800 		break;
2801 
2802 	case RDMA_CM_EVENT_DISCONNECTED:
2803 		if (ch->connected) {
2804 			shost_printk(KERN_WARNING, target->scsi_host,
2805 				     PFX "received DREQ\n");
2806 			rdma_disconnect(ch->rdma_cm.cm_id);
2807 			comp = 1;
2808 			ch->status = 0;
2809 			queue_work(system_long_wq, &target->tl_err_work);
2810 		}
2811 		break;
2812 
2813 	case RDMA_CM_EVENT_TIMEWAIT_EXIT:
2814 		shost_printk(KERN_ERR, target->scsi_host,
2815 			     PFX "connection closed\n");
2816 
2817 		comp = 1;
2818 		ch->status = 0;
2819 		break;
2820 
2821 	default:
2822 		shost_printk(KERN_WARNING, target->scsi_host,
2823 			     PFX "Unhandled CM event %d\n", event->event);
2824 		break;
2825 	}
2826 
2827 	if (comp)
2828 		complete(&ch->done);
2829 
2830 	return 0;
2831 }
2832 
2833 /**
2834  * srp_change_queue_depth - setting device queue depth
2835  * @sdev: scsi device struct
2836  * @qdepth: requested queue depth
2837  *
2838  * Returns queue depth.
2839  */
2840 static int
2841 srp_change_queue_depth(struct scsi_device *sdev, int qdepth)
2842 {
2843 	if (!sdev->tagged_supported)
2844 		qdepth = 1;
2845 	return scsi_change_queue_depth(sdev, qdepth);
2846 }
2847 
2848 static int srp_send_tsk_mgmt(struct srp_rdma_ch *ch, u64 req_tag, u64 lun,
2849 			     u8 func, u8 *status)
2850 {
2851 	struct srp_target_port *target = ch->target;
2852 	struct srp_rport *rport = target->rport;
2853 	struct ib_device *dev = target->srp_host->srp_dev->dev;
2854 	struct srp_iu *iu;
2855 	struct srp_tsk_mgmt *tsk_mgmt;
2856 	int res;
2857 
2858 	if (!ch->connected || target->qp_in_error)
2859 		return -1;
2860 
2861 	/*
2862 	 * Lock the rport mutex to avoid that srp_create_ch_ib() is
2863 	 * invoked while a task management function is being sent.
2864 	 */
2865 	mutex_lock(&rport->mutex);
2866 	spin_lock_irq(&ch->lock);
2867 	iu = __srp_get_tx_iu(ch, SRP_IU_TSK_MGMT);
2868 	spin_unlock_irq(&ch->lock);
2869 
2870 	if (!iu) {
2871 		mutex_unlock(&rport->mutex);
2872 
2873 		return -1;
2874 	}
2875 
2876 	ib_dma_sync_single_for_cpu(dev, iu->dma, sizeof *tsk_mgmt,
2877 				   DMA_TO_DEVICE);
2878 	tsk_mgmt = iu->buf;
2879 	memset(tsk_mgmt, 0, sizeof *tsk_mgmt);
2880 
2881 	tsk_mgmt->opcode 	= SRP_TSK_MGMT;
2882 	int_to_scsilun(lun, &tsk_mgmt->lun);
2883 	tsk_mgmt->tsk_mgmt_func = func;
2884 	tsk_mgmt->task_tag	= req_tag;
2885 
2886 	spin_lock_irq(&ch->lock);
2887 	ch->tsk_mgmt_tag = (ch->tsk_mgmt_tag + 1) | SRP_TAG_TSK_MGMT;
2888 	tsk_mgmt->tag = ch->tsk_mgmt_tag;
2889 	spin_unlock_irq(&ch->lock);
2890 
2891 	init_completion(&ch->tsk_mgmt_done);
2892 
2893 	ib_dma_sync_single_for_device(dev, iu->dma, sizeof *tsk_mgmt,
2894 				      DMA_TO_DEVICE);
2895 	if (srp_post_send(ch, iu, sizeof(*tsk_mgmt))) {
2896 		srp_put_tx_iu(ch, iu, SRP_IU_TSK_MGMT);
2897 		mutex_unlock(&rport->mutex);
2898 
2899 		return -1;
2900 	}
2901 	res = wait_for_completion_timeout(&ch->tsk_mgmt_done,
2902 					msecs_to_jiffies(SRP_ABORT_TIMEOUT_MS));
2903 	if (res > 0 && status)
2904 		*status = ch->tsk_mgmt_status;
2905 	mutex_unlock(&rport->mutex);
2906 
2907 	WARN_ON_ONCE(res < 0);
2908 
2909 	return res > 0 ? 0 : -1;
2910 }
2911 
2912 static int srp_abort(struct scsi_cmnd *scmnd)
2913 {
2914 	struct srp_target_port *target = host_to_target(scmnd->device->host);
2915 	struct srp_request *req = (struct srp_request *) scmnd->host_scribble;
2916 	u32 tag;
2917 	u16 ch_idx;
2918 	struct srp_rdma_ch *ch;
2919 	int ret;
2920 
2921 	shost_printk(KERN_ERR, target->scsi_host, "SRP abort called\n");
2922 
2923 	if (!req)
2924 		return SUCCESS;
2925 	tag = blk_mq_unique_tag(scmnd->request);
2926 	ch_idx = blk_mq_unique_tag_to_hwq(tag);
2927 	if (WARN_ON_ONCE(ch_idx >= target->ch_count))
2928 		return SUCCESS;
2929 	ch = &target->ch[ch_idx];
2930 	if (!srp_claim_req(ch, req, NULL, scmnd))
2931 		return SUCCESS;
2932 	shost_printk(KERN_ERR, target->scsi_host,
2933 		     "Sending SRP abort for tag %#x\n", tag);
2934 	if (srp_send_tsk_mgmt(ch, tag, scmnd->device->lun,
2935 			      SRP_TSK_ABORT_TASK, NULL) == 0)
2936 		ret = SUCCESS;
2937 	else if (target->rport->state == SRP_RPORT_LOST)
2938 		ret = FAST_IO_FAIL;
2939 	else
2940 		ret = FAILED;
2941 	if (ret == SUCCESS) {
2942 		srp_free_req(ch, req, scmnd, 0);
2943 		scmnd->result = DID_ABORT << 16;
2944 		scmnd->scsi_done(scmnd);
2945 	}
2946 
2947 	return ret;
2948 }
2949 
2950 static int srp_reset_device(struct scsi_cmnd *scmnd)
2951 {
2952 	struct srp_target_port *target = host_to_target(scmnd->device->host);
2953 	struct srp_rdma_ch *ch;
2954 	int i;
2955 	u8 status;
2956 
2957 	shost_printk(KERN_ERR, target->scsi_host, "SRP reset_device called\n");
2958 
2959 	ch = &target->ch[0];
2960 	if (srp_send_tsk_mgmt(ch, SRP_TAG_NO_REQ, scmnd->device->lun,
2961 			      SRP_TSK_LUN_RESET, &status))
2962 		return FAILED;
2963 	if (status)
2964 		return FAILED;
2965 
2966 	for (i = 0; i < target->ch_count; i++) {
2967 		ch = &target->ch[i];
2968 		for (i = 0; i < target->req_ring_size; ++i) {
2969 			struct srp_request *req = &ch->req_ring[i];
2970 
2971 			srp_finish_req(ch, req, scmnd->device, DID_RESET << 16);
2972 		}
2973 	}
2974 
2975 	return SUCCESS;
2976 }
2977 
2978 static int srp_reset_host(struct scsi_cmnd *scmnd)
2979 {
2980 	struct srp_target_port *target = host_to_target(scmnd->device->host);
2981 
2982 	shost_printk(KERN_ERR, target->scsi_host, PFX "SRP reset_host called\n");
2983 
2984 	return srp_reconnect_rport(target->rport) == 0 ? SUCCESS : FAILED;
2985 }
2986 
2987 static int srp_target_alloc(struct scsi_target *starget)
2988 {
2989 	struct Scsi_Host *shost = dev_to_shost(starget->dev.parent);
2990 	struct srp_target_port *target = host_to_target(shost);
2991 
2992 	if (target->target_can_queue)
2993 		starget->can_queue = target->target_can_queue;
2994 	return 0;
2995 }
2996 
2997 static int srp_slave_alloc(struct scsi_device *sdev)
2998 {
2999 	struct Scsi_Host *shost = sdev->host;
3000 	struct srp_target_port *target = host_to_target(shost);
3001 	struct srp_device *srp_dev = target->srp_host->srp_dev;
3002 	struct ib_device *ibdev = srp_dev->dev;
3003 
3004 	if (!(ibdev->attrs.device_cap_flags & IB_DEVICE_SG_GAPS_REG))
3005 		blk_queue_virt_boundary(sdev->request_queue,
3006 					~srp_dev->mr_page_mask);
3007 
3008 	return 0;
3009 }
3010 
3011 static int srp_slave_configure(struct scsi_device *sdev)
3012 {
3013 	struct Scsi_Host *shost = sdev->host;
3014 	struct srp_target_port *target = host_to_target(shost);
3015 	struct request_queue *q = sdev->request_queue;
3016 	unsigned long timeout;
3017 
3018 	if (sdev->type == TYPE_DISK) {
3019 		timeout = max_t(unsigned, 30 * HZ, target->rq_tmo_jiffies);
3020 		blk_queue_rq_timeout(q, timeout);
3021 	}
3022 
3023 	return 0;
3024 }
3025 
3026 static ssize_t show_id_ext(struct device *dev, struct device_attribute *attr,
3027 			   char *buf)
3028 {
3029 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3030 
3031 	return sprintf(buf, "0x%016llx\n", be64_to_cpu(target->id_ext));
3032 }
3033 
3034 static ssize_t show_ioc_guid(struct device *dev, struct device_attribute *attr,
3035 			     char *buf)
3036 {
3037 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3038 
3039 	return sprintf(buf, "0x%016llx\n", be64_to_cpu(target->ioc_guid));
3040 }
3041 
3042 static ssize_t show_service_id(struct device *dev,
3043 			       struct device_attribute *attr, char *buf)
3044 {
3045 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3046 
3047 	if (target->using_rdma_cm)
3048 		return -ENOENT;
3049 	return sprintf(buf, "0x%016llx\n",
3050 		       be64_to_cpu(target->ib_cm.service_id));
3051 }
3052 
3053 static ssize_t show_pkey(struct device *dev, struct device_attribute *attr,
3054 			 char *buf)
3055 {
3056 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3057 
3058 	if (target->using_rdma_cm)
3059 		return -ENOENT;
3060 	return sprintf(buf, "0x%04x\n", be16_to_cpu(target->ib_cm.pkey));
3061 }
3062 
3063 static ssize_t show_sgid(struct device *dev, struct device_attribute *attr,
3064 			 char *buf)
3065 {
3066 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3067 
3068 	return sprintf(buf, "%pI6\n", target->sgid.raw);
3069 }
3070 
3071 static ssize_t show_dgid(struct device *dev, struct device_attribute *attr,
3072 			 char *buf)
3073 {
3074 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3075 	struct srp_rdma_ch *ch = &target->ch[0];
3076 
3077 	if (target->using_rdma_cm)
3078 		return -ENOENT;
3079 	return sprintf(buf, "%pI6\n", ch->ib_cm.path.dgid.raw);
3080 }
3081 
3082 static ssize_t show_orig_dgid(struct device *dev,
3083 			      struct device_attribute *attr, char *buf)
3084 {
3085 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3086 
3087 	if (target->using_rdma_cm)
3088 		return -ENOENT;
3089 	return sprintf(buf, "%pI6\n", target->ib_cm.orig_dgid.raw);
3090 }
3091 
3092 static ssize_t show_req_lim(struct device *dev,
3093 			    struct device_attribute *attr, char *buf)
3094 {
3095 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3096 	struct srp_rdma_ch *ch;
3097 	int i, req_lim = INT_MAX;
3098 
3099 	for (i = 0; i < target->ch_count; i++) {
3100 		ch = &target->ch[i];
3101 		req_lim = min(req_lim, ch->req_lim);
3102 	}
3103 	return sprintf(buf, "%d\n", req_lim);
3104 }
3105 
3106 static ssize_t show_zero_req_lim(struct device *dev,
3107 				 struct device_attribute *attr, char *buf)
3108 {
3109 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3110 
3111 	return sprintf(buf, "%d\n", target->zero_req_lim);
3112 }
3113 
3114 static ssize_t show_local_ib_port(struct device *dev,
3115 				  struct device_attribute *attr, char *buf)
3116 {
3117 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3118 
3119 	return sprintf(buf, "%d\n", target->srp_host->port);
3120 }
3121 
3122 static ssize_t show_local_ib_device(struct device *dev,
3123 				    struct device_attribute *attr, char *buf)
3124 {
3125 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3126 
3127 	return sprintf(buf, "%s\n", target->srp_host->srp_dev->dev->name);
3128 }
3129 
3130 static ssize_t show_ch_count(struct device *dev, struct device_attribute *attr,
3131 			     char *buf)
3132 {
3133 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3134 
3135 	return sprintf(buf, "%d\n", target->ch_count);
3136 }
3137 
3138 static ssize_t show_comp_vector(struct device *dev,
3139 				struct device_attribute *attr, char *buf)
3140 {
3141 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3142 
3143 	return sprintf(buf, "%d\n", target->comp_vector);
3144 }
3145 
3146 static ssize_t show_tl_retry_count(struct device *dev,
3147 				   struct device_attribute *attr, char *buf)
3148 {
3149 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3150 
3151 	return sprintf(buf, "%d\n", target->tl_retry_count);
3152 }
3153 
3154 static ssize_t show_cmd_sg_entries(struct device *dev,
3155 				   struct device_attribute *attr, char *buf)
3156 {
3157 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3158 
3159 	return sprintf(buf, "%u\n", target->cmd_sg_cnt);
3160 }
3161 
3162 static ssize_t show_allow_ext_sg(struct device *dev,
3163 				 struct device_attribute *attr, char *buf)
3164 {
3165 	struct srp_target_port *target = host_to_target(class_to_shost(dev));
3166 
3167 	return sprintf(buf, "%s\n", target->allow_ext_sg ? "true" : "false");
3168 }
3169 
3170 static DEVICE_ATTR(id_ext,	    S_IRUGO, show_id_ext,	   NULL);
3171 static DEVICE_ATTR(ioc_guid,	    S_IRUGO, show_ioc_guid,	   NULL);
3172 static DEVICE_ATTR(service_id,	    S_IRUGO, show_service_id,	   NULL);
3173 static DEVICE_ATTR(pkey,	    S_IRUGO, show_pkey,		   NULL);
3174 static DEVICE_ATTR(sgid,	    S_IRUGO, show_sgid,		   NULL);
3175 static DEVICE_ATTR(dgid,	    S_IRUGO, show_dgid,		   NULL);
3176 static DEVICE_ATTR(orig_dgid,	    S_IRUGO, show_orig_dgid,	   NULL);
3177 static DEVICE_ATTR(req_lim,         S_IRUGO, show_req_lim,         NULL);
3178 static DEVICE_ATTR(zero_req_lim,    S_IRUGO, show_zero_req_lim,	   NULL);
3179 static DEVICE_ATTR(local_ib_port,   S_IRUGO, show_local_ib_port,   NULL);
3180 static DEVICE_ATTR(local_ib_device, S_IRUGO, show_local_ib_device, NULL);
3181 static DEVICE_ATTR(ch_count,        S_IRUGO, show_ch_count,        NULL);
3182 static DEVICE_ATTR(comp_vector,     S_IRUGO, show_comp_vector,     NULL);
3183 static DEVICE_ATTR(tl_retry_count,  S_IRUGO, show_tl_retry_count,  NULL);
3184 static DEVICE_ATTR(cmd_sg_entries,  S_IRUGO, show_cmd_sg_entries,  NULL);
3185 static DEVICE_ATTR(allow_ext_sg,    S_IRUGO, show_allow_ext_sg,    NULL);
3186 
3187 static struct device_attribute *srp_host_attrs[] = {
3188 	&dev_attr_id_ext,
3189 	&dev_attr_ioc_guid,
3190 	&dev_attr_service_id,
3191 	&dev_attr_pkey,
3192 	&dev_attr_sgid,
3193 	&dev_attr_dgid,
3194 	&dev_attr_orig_dgid,
3195 	&dev_attr_req_lim,
3196 	&dev_attr_zero_req_lim,
3197 	&dev_attr_local_ib_port,
3198 	&dev_attr_local_ib_device,
3199 	&dev_attr_ch_count,
3200 	&dev_attr_comp_vector,
3201 	&dev_attr_tl_retry_count,
3202 	&dev_attr_cmd_sg_entries,
3203 	&dev_attr_allow_ext_sg,
3204 	NULL
3205 };
3206 
3207 static struct scsi_host_template srp_template = {
3208 	.module				= THIS_MODULE,
3209 	.name				= "InfiniBand SRP initiator",
3210 	.proc_name			= DRV_NAME,
3211 	.target_alloc			= srp_target_alloc,
3212 	.slave_alloc			= srp_slave_alloc,
3213 	.slave_configure		= srp_slave_configure,
3214 	.info				= srp_target_info,
3215 	.queuecommand			= srp_queuecommand,
3216 	.change_queue_depth             = srp_change_queue_depth,
3217 	.eh_timed_out			= srp_timed_out,
3218 	.eh_abort_handler		= srp_abort,
3219 	.eh_device_reset_handler	= srp_reset_device,
3220 	.eh_host_reset_handler		= srp_reset_host,
3221 	.skip_settle_delay		= true,
3222 	.sg_tablesize			= SRP_DEF_SG_TABLESIZE,
3223 	.can_queue			= SRP_DEFAULT_CMD_SQ_SIZE,
3224 	.this_id			= -1,
3225 	.cmd_per_lun			= SRP_DEFAULT_CMD_SQ_SIZE,
3226 	.use_clustering			= ENABLE_CLUSTERING,
3227 	.shost_attrs			= srp_host_attrs,
3228 	.track_queue_depth		= 1,
3229 };
3230 
3231 static int srp_sdev_count(struct Scsi_Host *host)
3232 {
3233 	struct scsi_device *sdev;
3234 	int c = 0;
3235 
3236 	shost_for_each_device(sdev, host)
3237 		c++;
3238 
3239 	return c;
3240 }
3241 
3242 /*
3243  * Return values:
3244  * < 0 upon failure. Caller is responsible for SRP target port cleanup.
3245  * 0 and target->state == SRP_TARGET_REMOVED if asynchronous target port
3246  *    removal has been scheduled.
3247  * 0 and target->state != SRP_TARGET_REMOVED upon success.
3248  */
3249 static int srp_add_target(struct srp_host *host, struct srp_target_port *target)
3250 {
3251 	struct srp_rport_identifiers ids;
3252 	struct srp_rport *rport;
3253 
3254 	target->state = SRP_TARGET_SCANNING;
3255 	sprintf(target->target_name, "SRP.T10:%016llX",
3256 		be64_to_cpu(target->id_ext));
3257 
3258 	if (scsi_add_host(target->scsi_host, host->srp_dev->dev->dev.parent))
3259 		return -ENODEV;
3260 
3261 	memcpy(ids.port_id, &target->id_ext, 8);
3262 	memcpy(ids.port_id + 8, &target->ioc_guid, 8);
3263 	ids.roles = SRP_RPORT_ROLE_TARGET;
3264 	rport = srp_rport_add(target->scsi_host, &ids);
3265 	if (IS_ERR(rport)) {
3266 		scsi_remove_host(target->scsi_host);
3267 		return PTR_ERR(rport);
3268 	}
3269 
3270 	rport->lld_data = target;
3271 	target->rport = rport;
3272 
3273 	spin_lock(&host->target_lock);
3274 	list_add_tail(&target->list, &host->target_list);
3275 	spin_unlock(&host->target_lock);
3276 
3277 	scsi_scan_target(&target->scsi_host->shost_gendev,
3278 			 0, target->scsi_id, SCAN_WILD_CARD, SCSI_SCAN_INITIAL);
3279 
3280 	if (srp_connected_ch(target) < target->ch_count ||
3281 	    target->qp_in_error) {
3282 		shost_printk(KERN_INFO, target->scsi_host,
3283 			     PFX "SCSI scan failed - removing SCSI host\n");
3284 		srp_queue_remove_work(target);
3285 		goto out;
3286 	}
3287 
3288 	pr_debug("%s: SCSI scan succeeded - detected %d LUNs\n",
3289 		 dev_name(&target->scsi_host->shost_gendev),
3290 		 srp_sdev_count(target->scsi_host));
3291 
3292 	spin_lock_irq(&target->lock);
3293 	if (target->state == SRP_TARGET_SCANNING)
3294 		target->state = SRP_TARGET_LIVE;
3295 	spin_unlock_irq(&target->lock);
3296 
3297 out:
3298 	return 0;
3299 }
3300 
3301 static void srp_release_dev(struct device *dev)
3302 {
3303 	struct srp_host *host =
3304 		container_of(dev, struct srp_host, dev);
3305 
3306 	complete(&host->released);
3307 }
3308 
3309 static struct class srp_class = {
3310 	.name    = "infiniband_srp",
3311 	.dev_release = srp_release_dev
3312 };
3313 
3314 /**
3315  * srp_conn_unique() - check whether the connection to a target is unique
3316  * @host:   SRP host.
3317  * @target: SRP target port.
3318  */
3319 static bool srp_conn_unique(struct srp_host *host,
3320 			    struct srp_target_port *target)
3321 {
3322 	struct srp_target_port *t;
3323 	bool ret = false;
3324 
3325 	if (target->state == SRP_TARGET_REMOVED)
3326 		goto out;
3327 
3328 	ret = true;
3329 
3330 	spin_lock(&host->target_lock);
3331 	list_for_each_entry(t, &host->target_list, list) {
3332 		if (t != target &&
3333 		    target->id_ext == t->id_ext &&
3334 		    target->ioc_guid == t->ioc_guid &&
3335 		    target->initiator_ext == t->initiator_ext) {
3336 			ret = false;
3337 			break;
3338 		}
3339 	}
3340 	spin_unlock(&host->target_lock);
3341 
3342 out:
3343 	return ret;
3344 }
3345 
3346 /*
3347  * Target ports are added by writing
3348  *
3349  *     id_ext=<SRP ID ext>,ioc_guid=<SRP IOC GUID>,dgid=<dest GID>,
3350  *     pkey=<P_Key>,service_id=<service ID>
3351  * or
3352  *     id_ext=<SRP ID ext>,ioc_guid=<SRP IOC GUID>,
3353  *     [src=<IPv4 address>,]dest=<IPv4 address>:<port number>
3354  *
3355  * to the add_target sysfs attribute.
3356  */
3357 enum {
3358 	SRP_OPT_ERR		= 0,
3359 	SRP_OPT_ID_EXT		= 1 << 0,
3360 	SRP_OPT_IOC_GUID	= 1 << 1,
3361 	SRP_OPT_DGID		= 1 << 2,
3362 	SRP_OPT_PKEY		= 1 << 3,
3363 	SRP_OPT_SERVICE_ID	= 1 << 4,
3364 	SRP_OPT_MAX_SECT	= 1 << 5,
3365 	SRP_OPT_MAX_CMD_PER_LUN	= 1 << 6,
3366 	SRP_OPT_IO_CLASS	= 1 << 7,
3367 	SRP_OPT_INITIATOR_EXT	= 1 << 8,
3368 	SRP_OPT_CMD_SG_ENTRIES	= 1 << 9,
3369 	SRP_OPT_ALLOW_EXT_SG	= 1 << 10,
3370 	SRP_OPT_SG_TABLESIZE	= 1 << 11,
3371 	SRP_OPT_COMP_VECTOR	= 1 << 12,
3372 	SRP_OPT_TL_RETRY_COUNT	= 1 << 13,
3373 	SRP_OPT_QUEUE_SIZE	= 1 << 14,
3374 	SRP_OPT_IP_SRC		= 1 << 15,
3375 	SRP_OPT_IP_DEST		= 1 << 16,
3376 	SRP_OPT_TARGET_CAN_QUEUE= 1 << 17,
3377 };
3378 
3379 static unsigned int srp_opt_mandatory[] = {
3380 	SRP_OPT_ID_EXT		|
3381 	SRP_OPT_IOC_GUID	|
3382 	SRP_OPT_DGID		|
3383 	SRP_OPT_PKEY		|
3384 	SRP_OPT_SERVICE_ID,
3385 	SRP_OPT_ID_EXT		|
3386 	SRP_OPT_IOC_GUID	|
3387 	SRP_OPT_IP_DEST,
3388 };
3389 
3390 static const match_table_t srp_opt_tokens = {
3391 	{ SRP_OPT_ID_EXT,		"id_ext=%s" 		},
3392 	{ SRP_OPT_IOC_GUID,		"ioc_guid=%s" 		},
3393 	{ SRP_OPT_DGID,			"dgid=%s" 		},
3394 	{ SRP_OPT_PKEY,			"pkey=%x" 		},
3395 	{ SRP_OPT_SERVICE_ID,		"service_id=%s"		},
3396 	{ SRP_OPT_MAX_SECT,		"max_sect=%d" 		},
3397 	{ SRP_OPT_MAX_CMD_PER_LUN,	"max_cmd_per_lun=%d" 	},
3398 	{ SRP_OPT_TARGET_CAN_QUEUE,	"target_can_queue=%d"	},
3399 	{ SRP_OPT_IO_CLASS,		"io_class=%x"		},
3400 	{ SRP_OPT_INITIATOR_EXT,	"initiator_ext=%s"	},
3401 	{ SRP_OPT_CMD_SG_ENTRIES,	"cmd_sg_entries=%u"	},
3402 	{ SRP_OPT_ALLOW_EXT_SG,		"allow_ext_sg=%u"	},
3403 	{ SRP_OPT_SG_TABLESIZE,		"sg_tablesize=%u"	},
3404 	{ SRP_OPT_COMP_VECTOR,		"comp_vector=%u"	},
3405 	{ SRP_OPT_TL_RETRY_COUNT,	"tl_retry_count=%u"	},
3406 	{ SRP_OPT_QUEUE_SIZE,		"queue_size=%d"		},
3407 	{ SRP_OPT_IP_SRC,		"src=%s"		},
3408 	{ SRP_OPT_IP_DEST,		"dest=%s"		},
3409 	{ SRP_OPT_ERR,			NULL 			}
3410 };
3411 
3412 /**
3413  * srp_parse_in - parse an IP address and port number combination
3414  *
3415  * Parse the following address formats:
3416  * - IPv4: <ip_address>:<port>, e.g. 1.2.3.4:5.
3417  * - IPv6: \[<ipv6_address>\]:<port>, e.g. [1::2:3%4]:5.
3418  */
3419 static int srp_parse_in(struct net *net, struct sockaddr_storage *sa,
3420 			const char *addr_port_str)
3421 {
3422 	char *addr_end, *addr = kstrdup(addr_port_str, GFP_KERNEL);
3423 	char *port_str;
3424 	int ret;
3425 
3426 	if (!addr)
3427 		return -ENOMEM;
3428 	port_str = strrchr(addr, ':');
3429 	if (!port_str)
3430 		return -EINVAL;
3431 	*port_str++ = '\0';
3432 	ret = inet_pton_with_scope(net, AF_INET, addr, port_str, sa);
3433 	if (ret && addr[0]) {
3434 		addr_end = addr + strlen(addr) - 1;
3435 		if (addr[0] == '[' && *addr_end == ']') {
3436 			*addr_end = '\0';
3437 			ret = inet_pton_with_scope(net, AF_INET6, addr + 1,
3438 						   port_str, sa);
3439 		}
3440 	}
3441 	kfree(addr);
3442 	pr_debug("%s -> %pISpfsc\n", addr_port_str, sa);
3443 	return ret;
3444 }
3445 
3446 static int srp_parse_options(struct net *net, const char *buf,
3447 			     struct srp_target_port *target)
3448 {
3449 	char *options, *sep_opt;
3450 	char *p;
3451 	substring_t args[MAX_OPT_ARGS];
3452 	unsigned long long ull;
3453 	int opt_mask = 0;
3454 	int token;
3455 	int ret = -EINVAL;
3456 	int i;
3457 
3458 	options = kstrdup(buf, GFP_KERNEL);
3459 	if (!options)
3460 		return -ENOMEM;
3461 
3462 	sep_opt = options;
3463 	while ((p = strsep(&sep_opt, ",\n")) != NULL) {
3464 		if (!*p)
3465 			continue;
3466 
3467 		token = match_token(p, srp_opt_tokens, args);
3468 		opt_mask |= token;
3469 
3470 		switch (token) {
3471 		case SRP_OPT_ID_EXT:
3472 			p = match_strdup(args);
3473 			if (!p) {
3474 				ret = -ENOMEM;
3475 				goto out;
3476 			}
3477 			ret = kstrtoull(p, 16, &ull);
3478 			if (ret) {
3479 				pr_warn("invalid id_ext parameter '%s'\n", p);
3480 				kfree(p);
3481 				goto out;
3482 			}
3483 			target->id_ext = cpu_to_be64(ull);
3484 			kfree(p);
3485 			break;
3486 
3487 		case SRP_OPT_IOC_GUID:
3488 			p = match_strdup(args);
3489 			if (!p) {
3490 				ret = -ENOMEM;
3491 				goto out;
3492 			}
3493 			ret = kstrtoull(p, 16, &ull);
3494 			if (ret) {
3495 				pr_warn("invalid ioc_guid parameter '%s'\n", p);
3496 				kfree(p);
3497 				goto out;
3498 			}
3499 			target->ioc_guid = cpu_to_be64(ull);
3500 			kfree(p);
3501 			break;
3502 
3503 		case SRP_OPT_DGID:
3504 			p = match_strdup(args);
3505 			if (!p) {
3506 				ret = -ENOMEM;
3507 				goto out;
3508 			}
3509 			if (strlen(p) != 32) {
3510 				pr_warn("bad dest GID parameter '%s'\n", p);
3511 				kfree(p);
3512 				goto out;
3513 			}
3514 
3515 			ret = hex2bin(target->ib_cm.orig_dgid.raw, p, 16);
3516 			kfree(p);
3517 			if (ret < 0)
3518 				goto out;
3519 			break;
3520 
3521 		case SRP_OPT_PKEY:
3522 			if (match_hex(args, &token)) {
3523 				pr_warn("bad P_Key parameter '%s'\n", p);
3524 				goto out;
3525 			}
3526 			target->ib_cm.pkey = cpu_to_be16(token);
3527 			break;
3528 
3529 		case SRP_OPT_SERVICE_ID:
3530 			p = match_strdup(args);
3531 			if (!p) {
3532 				ret = -ENOMEM;
3533 				goto out;
3534 			}
3535 			ret = kstrtoull(p, 16, &ull);
3536 			if (ret) {
3537 				pr_warn("bad service_id parameter '%s'\n", p);
3538 				kfree(p);
3539 				goto out;
3540 			}
3541 			target->ib_cm.service_id = cpu_to_be64(ull);
3542 			kfree(p);
3543 			break;
3544 
3545 		case SRP_OPT_IP_SRC:
3546 			p = match_strdup(args);
3547 			if (!p) {
3548 				ret = -ENOMEM;
3549 				goto out;
3550 			}
3551 			ret = srp_parse_in(net, &target->rdma_cm.src.ss, p);
3552 			if (ret < 0) {
3553 				pr_warn("bad source parameter '%s'\n", p);
3554 				kfree(p);
3555 				goto out;
3556 			}
3557 			target->rdma_cm.src_specified = true;
3558 			kfree(p);
3559 			break;
3560 
3561 		case SRP_OPT_IP_DEST:
3562 			p = match_strdup(args);
3563 			if (!p) {
3564 				ret = -ENOMEM;
3565 				goto out;
3566 			}
3567 			ret = srp_parse_in(net, &target->rdma_cm.dst.ss, p);
3568 			if (ret < 0) {
3569 				pr_warn("bad dest parameter '%s'\n", p);
3570 				kfree(p);
3571 				goto out;
3572 			}
3573 			target->using_rdma_cm = true;
3574 			kfree(p);
3575 			break;
3576 
3577 		case SRP_OPT_MAX_SECT:
3578 			if (match_int(args, &token)) {
3579 				pr_warn("bad max sect parameter '%s'\n", p);
3580 				goto out;
3581 			}
3582 			target->scsi_host->max_sectors = token;
3583 			break;
3584 
3585 		case SRP_OPT_QUEUE_SIZE:
3586 			if (match_int(args, &token) || token < 1) {
3587 				pr_warn("bad queue_size parameter '%s'\n", p);
3588 				goto out;
3589 			}
3590 			target->scsi_host->can_queue = token;
3591 			target->queue_size = token + SRP_RSP_SQ_SIZE +
3592 					     SRP_TSK_MGMT_SQ_SIZE;
3593 			if (!(opt_mask & SRP_OPT_MAX_CMD_PER_LUN))
3594 				target->scsi_host->cmd_per_lun = token;
3595 			break;
3596 
3597 		case SRP_OPT_MAX_CMD_PER_LUN:
3598 			if (match_int(args, &token) || token < 1) {
3599 				pr_warn("bad max cmd_per_lun parameter '%s'\n",
3600 					p);
3601 				goto out;
3602 			}
3603 			target->scsi_host->cmd_per_lun = token;
3604 			break;
3605 
3606 		case SRP_OPT_TARGET_CAN_QUEUE:
3607 			if (match_int(args, &token) || token < 1) {
3608 				pr_warn("bad max target_can_queue parameter '%s'\n",
3609 					p);
3610 				goto out;
3611 			}
3612 			target->target_can_queue = token;
3613 			break;
3614 
3615 		case SRP_OPT_IO_CLASS:
3616 			if (match_hex(args, &token)) {
3617 				pr_warn("bad IO class parameter '%s'\n", p);
3618 				goto out;
3619 			}
3620 			if (token != SRP_REV10_IB_IO_CLASS &&
3621 			    token != SRP_REV16A_IB_IO_CLASS) {
3622 				pr_warn("unknown IO class parameter value %x specified (use %x or %x).\n",
3623 					token, SRP_REV10_IB_IO_CLASS,
3624 					SRP_REV16A_IB_IO_CLASS);
3625 				goto out;
3626 			}
3627 			target->io_class = token;
3628 			break;
3629 
3630 		case SRP_OPT_INITIATOR_EXT:
3631 			p = match_strdup(args);
3632 			if (!p) {
3633 				ret = -ENOMEM;
3634 				goto out;
3635 			}
3636 			ret = kstrtoull(p, 16, &ull);
3637 			if (ret) {
3638 				pr_warn("bad initiator_ext value '%s'\n", p);
3639 				kfree(p);
3640 				goto out;
3641 			}
3642 			target->initiator_ext = cpu_to_be64(ull);
3643 			kfree(p);
3644 			break;
3645 
3646 		case SRP_OPT_CMD_SG_ENTRIES:
3647 			if (match_int(args, &token) || token < 1 || token > 255) {
3648 				pr_warn("bad max cmd_sg_entries parameter '%s'\n",
3649 					p);
3650 				goto out;
3651 			}
3652 			target->cmd_sg_cnt = token;
3653 			break;
3654 
3655 		case SRP_OPT_ALLOW_EXT_SG:
3656 			if (match_int(args, &token)) {
3657 				pr_warn("bad allow_ext_sg parameter '%s'\n", p);
3658 				goto out;
3659 			}
3660 			target->allow_ext_sg = !!token;
3661 			break;
3662 
3663 		case SRP_OPT_SG_TABLESIZE:
3664 			if (match_int(args, &token) || token < 1 ||
3665 					token > SG_MAX_SEGMENTS) {
3666 				pr_warn("bad max sg_tablesize parameter '%s'\n",
3667 					p);
3668 				goto out;
3669 			}
3670 			target->sg_tablesize = token;
3671 			break;
3672 
3673 		case SRP_OPT_COMP_VECTOR:
3674 			if (match_int(args, &token) || token < 0) {
3675 				pr_warn("bad comp_vector parameter '%s'\n", p);
3676 				goto out;
3677 			}
3678 			target->comp_vector = token;
3679 			break;
3680 
3681 		case SRP_OPT_TL_RETRY_COUNT:
3682 			if (match_int(args, &token) || token < 2 || token > 7) {
3683 				pr_warn("bad tl_retry_count parameter '%s' (must be a number between 2 and 7)\n",
3684 					p);
3685 				goto out;
3686 			}
3687 			target->tl_retry_count = token;
3688 			break;
3689 
3690 		default:
3691 			pr_warn("unknown parameter or missing value '%s' in target creation request\n",
3692 				p);
3693 			goto out;
3694 		}
3695 	}
3696 
3697 	for (i = 0; i < ARRAY_SIZE(srp_opt_mandatory); i++) {
3698 		if ((opt_mask & srp_opt_mandatory[i]) == srp_opt_mandatory[i]) {
3699 			ret = 0;
3700 			break;
3701 		}
3702 	}
3703 	if (ret)
3704 		pr_warn("target creation request is missing one or more parameters\n");
3705 
3706 	if (target->scsi_host->cmd_per_lun > target->scsi_host->can_queue
3707 	    && (opt_mask & SRP_OPT_MAX_CMD_PER_LUN))
3708 		pr_warn("cmd_per_lun = %d > queue_size = %d\n",
3709 			target->scsi_host->cmd_per_lun,
3710 			target->scsi_host->can_queue);
3711 
3712 out:
3713 	kfree(options);
3714 	return ret;
3715 }
3716 
3717 static ssize_t srp_create_target(struct device *dev,
3718 				 struct device_attribute *attr,
3719 				 const char *buf, size_t count)
3720 {
3721 	struct srp_host *host =
3722 		container_of(dev, struct srp_host, dev);
3723 	struct Scsi_Host *target_host;
3724 	struct srp_target_port *target;
3725 	struct srp_rdma_ch *ch;
3726 	struct srp_device *srp_dev = host->srp_dev;
3727 	struct ib_device *ibdev = srp_dev->dev;
3728 	int ret, node_idx, node, cpu, i;
3729 	unsigned int max_sectors_per_mr, mr_per_cmd = 0;
3730 	bool multich = false;
3731 
3732 	target_host = scsi_host_alloc(&srp_template,
3733 				      sizeof (struct srp_target_port));
3734 	if (!target_host)
3735 		return -ENOMEM;
3736 
3737 	target_host->transportt  = ib_srp_transport_template;
3738 	target_host->max_channel = 0;
3739 	target_host->max_id      = 1;
3740 	target_host->max_lun     = -1LL;
3741 	target_host->max_cmd_len = sizeof ((struct srp_cmd *) (void *) 0L)->cdb;
3742 
3743 	target = host_to_target(target_host);
3744 
3745 	target->net		= kobj_ns_grab_current(KOBJ_NS_TYPE_NET);
3746 	target->io_class	= SRP_REV16A_IB_IO_CLASS;
3747 	target->scsi_host	= target_host;
3748 	target->srp_host	= host;
3749 	target->lkey		= host->srp_dev->pd->local_dma_lkey;
3750 	target->global_rkey	= host->srp_dev->global_rkey;
3751 	target->cmd_sg_cnt	= cmd_sg_entries;
3752 	target->sg_tablesize	= indirect_sg_entries ? : cmd_sg_entries;
3753 	target->allow_ext_sg	= allow_ext_sg;
3754 	target->tl_retry_count	= 7;
3755 	target->queue_size	= SRP_DEFAULT_QUEUE_SIZE;
3756 
3757 	/*
3758 	 * Avoid that the SCSI host can be removed by srp_remove_target()
3759 	 * before this function returns.
3760 	 */
3761 	scsi_host_get(target->scsi_host);
3762 
3763 	ret = mutex_lock_interruptible(&host->add_target_mutex);
3764 	if (ret < 0)
3765 		goto put;
3766 
3767 	ret = srp_parse_options(target->net, buf, target);
3768 	if (ret)
3769 		goto out;
3770 
3771 	target->req_ring_size = target->queue_size - SRP_TSK_MGMT_SQ_SIZE;
3772 
3773 	if (!srp_conn_unique(target->srp_host, target)) {
3774 		if (target->using_rdma_cm) {
3775 			shost_printk(KERN_INFO, target->scsi_host,
3776 				     PFX "Already connected to target port with id_ext=%016llx;ioc_guid=%016llx;dest=%pIS\n",
3777 				     be64_to_cpu(target->id_ext),
3778 				     be64_to_cpu(target->ioc_guid),
3779 				     &target->rdma_cm.dst);
3780 		} else {
3781 			shost_printk(KERN_INFO, target->scsi_host,
3782 				     PFX "Already connected to target port with id_ext=%016llx;ioc_guid=%016llx;initiator_ext=%016llx\n",
3783 				     be64_to_cpu(target->id_ext),
3784 				     be64_to_cpu(target->ioc_guid),
3785 				     be64_to_cpu(target->initiator_ext));
3786 		}
3787 		ret = -EEXIST;
3788 		goto out;
3789 	}
3790 
3791 	if (!srp_dev->has_fmr && !srp_dev->has_fr && !target->allow_ext_sg &&
3792 	    target->cmd_sg_cnt < target->sg_tablesize) {
3793 		pr_warn("No MR pool and no external indirect descriptors, limiting sg_tablesize to cmd_sg_cnt\n");
3794 		target->sg_tablesize = target->cmd_sg_cnt;
3795 	}
3796 
3797 	if (srp_dev->use_fast_reg || srp_dev->use_fmr) {
3798 		bool gaps_reg = (ibdev->attrs.device_cap_flags &
3799 				 IB_DEVICE_SG_GAPS_REG);
3800 
3801 		max_sectors_per_mr = srp_dev->max_pages_per_mr <<
3802 				  (ilog2(srp_dev->mr_page_size) - 9);
3803 		if (!gaps_reg) {
3804 			/*
3805 			 * FR and FMR can only map one HCA page per entry. If
3806 			 * the start address is not aligned on a HCA page
3807 			 * boundary two entries will be used for the head and
3808 			 * the tail although these two entries combined
3809 			 * contain at most one HCA page of data. Hence the "+
3810 			 * 1" in the calculation below.
3811 			 *
3812 			 * The indirect data buffer descriptor is contiguous
3813 			 * so the memory for that buffer will only be
3814 			 * registered if register_always is true. Hence add
3815 			 * one to mr_per_cmd if register_always has been set.
3816 			 */
3817 			mr_per_cmd = register_always +
3818 				(target->scsi_host->max_sectors + 1 +
3819 				 max_sectors_per_mr - 1) / max_sectors_per_mr;
3820 		} else {
3821 			mr_per_cmd = register_always +
3822 				(target->sg_tablesize +
3823 				 srp_dev->max_pages_per_mr - 1) /
3824 				srp_dev->max_pages_per_mr;
3825 		}
3826 		pr_debug("max_sectors = %u; max_pages_per_mr = %u; mr_page_size = %u; max_sectors_per_mr = %u; mr_per_cmd = %u\n",
3827 			 target->scsi_host->max_sectors, srp_dev->max_pages_per_mr, srp_dev->mr_page_size,
3828 			 max_sectors_per_mr, mr_per_cmd);
3829 	}
3830 
3831 	target_host->sg_tablesize = target->sg_tablesize;
3832 	target->mr_pool_size = target->scsi_host->can_queue * mr_per_cmd;
3833 	target->mr_per_cmd = mr_per_cmd;
3834 	target->indirect_size = target->sg_tablesize *
3835 				sizeof (struct srp_direct_buf);
3836 	target->max_iu_len = sizeof (struct srp_cmd) +
3837 			     sizeof (struct srp_indirect_buf) +
3838 			     target->cmd_sg_cnt * sizeof (struct srp_direct_buf);
3839 
3840 	INIT_WORK(&target->tl_err_work, srp_tl_err_work);
3841 	INIT_WORK(&target->remove_work, srp_remove_work);
3842 	spin_lock_init(&target->lock);
3843 	ret = rdma_query_gid(ibdev, host->port, 0, &target->sgid);
3844 	if (ret)
3845 		goto out;
3846 
3847 	ret = -ENOMEM;
3848 	target->ch_count = max_t(unsigned, num_online_nodes(),
3849 				 min(ch_count ? :
3850 				     min(4 * num_online_nodes(),
3851 					 ibdev->num_comp_vectors),
3852 				     num_online_cpus()));
3853 	target->ch = kcalloc(target->ch_count, sizeof(*target->ch),
3854 			     GFP_KERNEL);
3855 	if (!target->ch)
3856 		goto out;
3857 
3858 	node_idx = 0;
3859 	for_each_online_node(node) {
3860 		const int ch_start = (node_idx * target->ch_count /
3861 				      num_online_nodes());
3862 		const int ch_end = ((node_idx + 1) * target->ch_count /
3863 				    num_online_nodes());
3864 		const int cv_start = node_idx * ibdev->num_comp_vectors /
3865 				     num_online_nodes();
3866 		const int cv_end = (node_idx + 1) * ibdev->num_comp_vectors /
3867 				   num_online_nodes();
3868 		int cpu_idx = 0;
3869 
3870 		for_each_online_cpu(cpu) {
3871 			if (cpu_to_node(cpu) != node)
3872 				continue;
3873 			if (ch_start + cpu_idx >= ch_end)
3874 				continue;
3875 			ch = &target->ch[ch_start + cpu_idx];
3876 			ch->target = target;
3877 			ch->comp_vector = cv_start == cv_end ? cv_start :
3878 				cv_start + cpu_idx % (cv_end - cv_start);
3879 			spin_lock_init(&ch->lock);
3880 			INIT_LIST_HEAD(&ch->free_tx);
3881 			ret = srp_new_cm_id(ch);
3882 			if (ret)
3883 				goto err_disconnect;
3884 
3885 			ret = srp_create_ch_ib(ch);
3886 			if (ret)
3887 				goto err_disconnect;
3888 
3889 			ret = srp_alloc_req_data(ch);
3890 			if (ret)
3891 				goto err_disconnect;
3892 
3893 			ret = srp_connect_ch(ch, multich);
3894 			if (ret) {
3895 				char dst[64];
3896 
3897 				if (target->using_rdma_cm)
3898 					snprintf(dst, sizeof(dst), "%pIS",
3899 						 &target->rdma_cm.dst);
3900 				else
3901 					snprintf(dst, sizeof(dst), "%pI6",
3902 						 target->ib_cm.orig_dgid.raw);
3903 				shost_printk(KERN_ERR, target->scsi_host,
3904 					     PFX "Connection %d/%d to %s failed\n",
3905 					     ch_start + cpu_idx,
3906 					     target->ch_count, dst);
3907 				if (node_idx == 0 && cpu_idx == 0) {
3908 					goto free_ch;
3909 				} else {
3910 					srp_free_ch_ib(target, ch);
3911 					srp_free_req_data(target, ch);
3912 					target->ch_count = ch - target->ch;
3913 					goto connected;
3914 				}
3915 			}
3916 
3917 			multich = true;
3918 			cpu_idx++;
3919 		}
3920 		node_idx++;
3921 	}
3922 
3923 connected:
3924 	target->scsi_host->nr_hw_queues = target->ch_count;
3925 
3926 	ret = srp_add_target(host, target);
3927 	if (ret)
3928 		goto err_disconnect;
3929 
3930 	if (target->state != SRP_TARGET_REMOVED) {
3931 		if (target->using_rdma_cm) {
3932 			shost_printk(KERN_DEBUG, target->scsi_host, PFX
3933 				     "new target: id_ext %016llx ioc_guid %016llx sgid %pI6 dest %pIS\n",
3934 				     be64_to_cpu(target->id_ext),
3935 				     be64_to_cpu(target->ioc_guid),
3936 				     target->sgid.raw, &target->rdma_cm.dst);
3937 		} else {
3938 			shost_printk(KERN_DEBUG, target->scsi_host, PFX
3939 				     "new target: id_ext %016llx ioc_guid %016llx pkey %04x service_id %016llx sgid %pI6 dgid %pI6\n",
3940 				     be64_to_cpu(target->id_ext),
3941 				     be64_to_cpu(target->ioc_guid),
3942 				     be16_to_cpu(target->ib_cm.pkey),
3943 				     be64_to_cpu(target->ib_cm.service_id),
3944 				     target->sgid.raw,
3945 				     target->ib_cm.orig_dgid.raw);
3946 		}
3947 	}
3948 
3949 	ret = count;
3950 
3951 out:
3952 	mutex_unlock(&host->add_target_mutex);
3953 
3954 put:
3955 	scsi_host_put(target->scsi_host);
3956 	if (ret < 0) {
3957 		/*
3958 		 * If a call to srp_remove_target() has not been scheduled,
3959 		 * drop the network namespace reference now that was obtained
3960 		 * earlier in this function.
3961 		 */
3962 		if (target->state != SRP_TARGET_REMOVED)
3963 			kobj_ns_drop(KOBJ_NS_TYPE_NET, target->net);
3964 		scsi_host_put(target->scsi_host);
3965 	}
3966 
3967 	return ret;
3968 
3969 err_disconnect:
3970 	srp_disconnect_target(target);
3971 
3972 free_ch:
3973 	for (i = 0; i < target->ch_count; i++) {
3974 		ch = &target->ch[i];
3975 		srp_free_ch_ib(target, ch);
3976 		srp_free_req_data(target, ch);
3977 	}
3978 
3979 	kfree(target->ch);
3980 	goto out;
3981 }
3982 
3983 static DEVICE_ATTR(add_target, S_IWUSR, NULL, srp_create_target);
3984 
3985 static ssize_t show_ibdev(struct device *dev, struct device_attribute *attr,
3986 			  char *buf)
3987 {
3988 	struct srp_host *host = container_of(dev, struct srp_host, dev);
3989 
3990 	return sprintf(buf, "%s\n", host->srp_dev->dev->name);
3991 }
3992 
3993 static DEVICE_ATTR(ibdev, S_IRUGO, show_ibdev, NULL);
3994 
3995 static ssize_t show_port(struct device *dev, struct device_attribute *attr,
3996 			 char *buf)
3997 {
3998 	struct srp_host *host = container_of(dev, struct srp_host, dev);
3999 
4000 	return sprintf(buf, "%d\n", host->port);
4001 }
4002 
4003 static DEVICE_ATTR(port, S_IRUGO, show_port, NULL);
4004 
4005 static struct srp_host *srp_add_port(struct srp_device *device, u8 port)
4006 {
4007 	struct srp_host *host;
4008 
4009 	host = kzalloc(sizeof *host, GFP_KERNEL);
4010 	if (!host)
4011 		return NULL;
4012 
4013 	INIT_LIST_HEAD(&host->target_list);
4014 	spin_lock_init(&host->target_lock);
4015 	init_completion(&host->released);
4016 	mutex_init(&host->add_target_mutex);
4017 	host->srp_dev = device;
4018 	host->port = port;
4019 
4020 	host->dev.class = &srp_class;
4021 	host->dev.parent = device->dev->dev.parent;
4022 	dev_set_name(&host->dev, "srp-%s-%d", device->dev->name, port);
4023 
4024 	if (device_register(&host->dev))
4025 		goto free_host;
4026 	if (device_create_file(&host->dev, &dev_attr_add_target))
4027 		goto err_class;
4028 	if (device_create_file(&host->dev, &dev_attr_ibdev))
4029 		goto err_class;
4030 	if (device_create_file(&host->dev, &dev_attr_port))
4031 		goto err_class;
4032 
4033 	return host;
4034 
4035 err_class:
4036 	device_unregister(&host->dev);
4037 
4038 free_host:
4039 	kfree(host);
4040 
4041 	return NULL;
4042 }
4043 
4044 static void srp_add_one(struct ib_device *device)
4045 {
4046 	struct srp_device *srp_dev;
4047 	struct ib_device_attr *attr = &device->attrs;
4048 	struct srp_host *host;
4049 	int mr_page_shift, p;
4050 	u64 max_pages_per_mr;
4051 	unsigned int flags = 0;
4052 
4053 	srp_dev = kzalloc(sizeof(*srp_dev), GFP_KERNEL);
4054 	if (!srp_dev)
4055 		return;
4056 
4057 	/*
4058 	 * Use the smallest page size supported by the HCA, down to a
4059 	 * minimum of 4096 bytes. We're unlikely to build large sglists
4060 	 * out of smaller entries.
4061 	 */
4062 	mr_page_shift		= max(12, ffs(attr->page_size_cap) - 1);
4063 	srp_dev->mr_page_size	= 1 << mr_page_shift;
4064 	srp_dev->mr_page_mask	= ~((u64) srp_dev->mr_page_size - 1);
4065 	max_pages_per_mr	= attr->max_mr_size;
4066 	do_div(max_pages_per_mr, srp_dev->mr_page_size);
4067 	pr_debug("%s: %llu / %u = %llu <> %u\n", __func__,
4068 		 attr->max_mr_size, srp_dev->mr_page_size,
4069 		 max_pages_per_mr, SRP_MAX_PAGES_PER_MR);
4070 	srp_dev->max_pages_per_mr = min_t(u64, SRP_MAX_PAGES_PER_MR,
4071 					  max_pages_per_mr);
4072 
4073 	srp_dev->has_fmr = (device->alloc_fmr && device->dealloc_fmr &&
4074 			    device->map_phys_fmr && device->unmap_fmr);
4075 	srp_dev->has_fr = (attr->device_cap_flags &
4076 			   IB_DEVICE_MEM_MGT_EXTENSIONS);
4077 	if (!never_register && !srp_dev->has_fmr && !srp_dev->has_fr) {
4078 		dev_warn(&device->dev, "neither FMR nor FR is supported\n");
4079 	} else if (!never_register &&
4080 		   attr->max_mr_size >= 2 * srp_dev->mr_page_size) {
4081 		srp_dev->use_fast_reg = (srp_dev->has_fr &&
4082 					 (!srp_dev->has_fmr || prefer_fr));
4083 		srp_dev->use_fmr = !srp_dev->use_fast_reg && srp_dev->has_fmr;
4084 	}
4085 
4086 	if (never_register || !register_always ||
4087 	    (!srp_dev->has_fmr && !srp_dev->has_fr))
4088 		flags |= IB_PD_UNSAFE_GLOBAL_RKEY;
4089 
4090 	if (srp_dev->use_fast_reg) {
4091 		srp_dev->max_pages_per_mr =
4092 			min_t(u32, srp_dev->max_pages_per_mr,
4093 			      attr->max_fast_reg_page_list_len);
4094 	}
4095 	srp_dev->mr_max_size	= srp_dev->mr_page_size *
4096 				   srp_dev->max_pages_per_mr;
4097 	pr_debug("%s: mr_page_shift = %d, device->max_mr_size = %#llx, device->max_fast_reg_page_list_len = %u, max_pages_per_mr = %d, mr_max_size = %#x\n",
4098 		 device->name, mr_page_shift, attr->max_mr_size,
4099 		 attr->max_fast_reg_page_list_len,
4100 		 srp_dev->max_pages_per_mr, srp_dev->mr_max_size);
4101 
4102 	INIT_LIST_HEAD(&srp_dev->dev_list);
4103 
4104 	srp_dev->dev = device;
4105 	srp_dev->pd  = ib_alloc_pd(device, flags);
4106 	if (IS_ERR(srp_dev->pd))
4107 		goto free_dev;
4108 
4109 	if (flags & IB_PD_UNSAFE_GLOBAL_RKEY) {
4110 		srp_dev->global_rkey = srp_dev->pd->unsafe_global_rkey;
4111 		WARN_ON_ONCE(srp_dev->global_rkey == 0);
4112 	}
4113 
4114 	for (p = rdma_start_port(device); p <= rdma_end_port(device); ++p) {
4115 		host = srp_add_port(srp_dev, p);
4116 		if (host)
4117 			list_add_tail(&host->list, &srp_dev->dev_list);
4118 	}
4119 
4120 	ib_set_client_data(device, &srp_client, srp_dev);
4121 	return;
4122 
4123 free_dev:
4124 	kfree(srp_dev);
4125 }
4126 
4127 static void srp_remove_one(struct ib_device *device, void *client_data)
4128 {
4129 	struct srp_device *srp_dev;
4130 	struct srp_host *host, *tmp_host;
4131 	struct srp_target_port *target;
4132 
4133 	srp_dev = client_data;
4134 	if (!srp_dev)
4135 		return;
4136 
4137 	list_for_each_entry_safe(host, tmp_host, &srp_dev->dev_list, list) {
4138 		device_unregister(&host->dev);
4139 		/*
4140 		 * Wait for the sysfs entry to go away, so that no new
4141 		 * target ports can be created.
4142 		 */
4143 		wait_for_completion(&host->released);
4144 
4145 		/*
4146 		 * Remove all target ports.
4147 		 */
4148 		spin_lock(&host->target_lock);
4149 		list_for_each_entry(target, &host->target_list, list)
4150 			srp_queue_remove_work(target);
4151 		spin_unlock(&host->target_lock);
4152 
4153 		/*
4154 		 * Wait for tl_err and target port removal tasks.
4155 		 */
4156 		flush_workqueue(system_long_wq);
4157 		flush_workqueue(srp_remove_wq);
4158 
4159 		kfree(host);
4160 	}
4161 
4162 	ib_dealloc_pd(srp_dev->pd);
4163 
4164 	kfree(srp_dev);
4165 }
4166 
4167 static struct srp_function_template ib_srp_transport_functions = {
4168 	.has_rport_state	 = true,
4169 	.reset_timer_if_blocked	 = true,
4170 	.reconnect_delay	 = &srp_reconnect_delay,
4171 	.fast_io_fail_tmo	 = &srp_fast_io_fail_tmo,
4172 	.dev_loss_tmo		 = &srp_dev_loss_tmo,
4173 	.reconnect		 = srp_rport_reconnect,
4174 	.rport_delete		 = srp_rport_delete,
4175 	.terminate_rport_io	 = srp_terminate_io,
4176 };
4177 
4178 static int __init srp_init_module(void)
4179 {
4180 	int ret;
4181 
4182 	if (srp_sg_tablesize) {
4183 		pr_warn("srp_sg_tablesize is deprecated, please use cmd_sg_entries\n");
4184 		if (!cmd_sg_entries)
4185 			cmd_sg_entries = srp_sg_tablesize;
4186 	}
4187 
4188 	if (!cmd_sg_entries)
4189 		cmd_sg_entries = SRP_DEF_SG_TABLESIZE;
4190 
4191 	if (cmd_sg_entries > 255) {
4192 		pr_warn("Clamping cmd_sg_entries to 255\n");
4193 		cmd_sg_entries = 255;
4194 	}
4195 
4196 	if (!indirect_sg_entries)
4197 		indirect_sg_entries = cmd_sg_entries;
4198 	else if (indirect_sg_entries < cmd_sg_entries) {
4199 		pr_warn("Bumping up indirect_sg_entries to match cmd_sg_entries (%u)\n",
4200 			cmd_sg_entries);
4201 		indirect_sg_entries = cmd_sg_entries;
4202 	}
4203 
4204 	if (indirect_sg_entries > SG_MAX_SEGMENTS) {
4205 		pr_warn("Clamping indirect_sg_entries to %u\n",
4206 			SG_MAX_SEGMENTS);
4207 		indirect_sg_entries = SG_MAX_SEGMENTS;
4208 	}
4209 
4210 	srp_remove_wq = create_workqueue("srp_remove");
4211 	if (!srp_remove_wq) {
4212 		ret = -ENOMEM;
4213 		goto out;
4214 	}
4215 
4216 	ret = -ENOMEM;
4217 	ib_srp_transport_template =
4218 		srp_attach_transport(&ib_srp_transport_functions);
4219 	if (!ib_srp_transport_template)
4220 		goto destroy_wq;
4221 
4222 	ret = class_register(&srp_class);
4223 	if (ret) {
4224 		pr_err("couldn't register class infiniband_srp\n");
4225 		goto release_tr;
4226 	}
4227 
4228 	ib_sa_register_client(&srp_sa_client);
4229 
4230 	ret = ib_register_client(&srp_client);
4231 	if (ret) {
4232 		pr_err("couldn't register IB client\n");
4233 		goto unreg_sa;
4234 	}
4235 
4236 out:
4237 	return ret;
4238 
4239 unreg_sa:
4240 	ib_sa_unregister_client(&srp_sa_client);
4241 	class_unregister(&srp_class);
4242 
4243 release_tr:
4244 	srp_release_transport(ib_srp_transport_template);
4245 
4246 destroy_wq:
4247 	destroy_workqueue(srp_remove_wq);
4248 	goto out;
4249 }
4250 
4251 static void __exit srp_cleanup_module(void)
4252 {
4253 	ib_unregister_client(&srp_client);
4254 	ib_sa_unregister_client(&srp_sa_client);
4255 	class_unregister(&srp_class);
4256 	srp_release_transport(ib_srp_transport_template);
4257 	destroy_workqueue(srp_remove_wq);
4258 }
4259 
4260 module_init(srp_init_module);
4261 module_exit(srp_cleanup_module);
4262