drivers/infiniband/ulp/srp/ib_srp.c
1 /*
2 * Copyright (c) 2005 Cisco Systems. All rights reserved.
3 *
4 * This software is available to you under a choice of one of two
5 * licenses. You may choose to be licensed under the terms of the GNU
6 * General Public License (GPL) Version 2, available from the file
7 * COPYING in the main directory of this source tree, or the
8 * OpenIB.org BSD license below:
9 *
10 * Redistribution and use in source and binary forms, with or
11 * without modification, are permitted provided that the following
12 * conditions are met:
13 *
14 * - Redistributions of source code must retain the above
15 * copyright notice, this list of conditions and the following
16 * disclaimer.
17 *
18 * - Redistributions in binary form must reproduce the above
19 * copyright notice, this list of conditions and the following
20 * disclaimer in the documentation and/or other materials
21 * provided with the distribution.
22 *
23 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
24 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
25 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
26 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
27 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
28 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
29 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30 * SOFTWARE.
31 */
32
33 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
34
35 #include <linux/module.h>
36 #include <linux/init.h>
37 #include <linux/slab.h>
38 #include <linux/err.h>
39 #include <linux/string.h>
40 #include <linux/parser.h>
41 #include <linux/random.h>
42 #include <linux/jiffies.h>
43 #include <rdma/ib_cache.h>
44
45 #include <linux/atomic.h>
46
47 #include <scsi/scsi.h>
48 #include <scsi/scsi_device.h>
49 #include <scsi/scsi_dbg.h>
50 #include <scsi/scsi_tcq.h>
51 #include <scsi/srp.h>
52 #include <scsi/scsi_transport_srp.h>
53
54 #include "ib_srp.h"
55
56 #define DRV_NAME "ib_srp"
57 #define PFX DRV_NAME ": "
58 #define DRV_VERSION "2.0"
59 #define DRV_RELDATE "July 26, 2015"
60
61 MODULE_AUTHOR("Roland Dreier");
62 MODULE_DESCRIPTION("InfiniBand SCSI RDMA Protocol initiator");
63 MODULE_LICENSE("Dual BSD/GPL");
64 MODULE_VERSION(DRV_VERSION);
65 MODULE_INFO(release_date, DRV_RELDATE);
66
67 static unsigned int srp_sg_tablesize;
68 static unsigned int cmd_sg_entries;
69 static unsigned int indirect_sg_entries;
70 static bool allow_ext_sg;
71 static bool prefer_fr = true;
72 static bool register_always = true;
73 static int topspin_workarounds = 1;
74
75 module_param(srp_sg_tablesize, uint, 0444);
76 MODULE_PARM_DESC(srp_sg_tablesize, "Deprecated name for cmd_sg_entries");
77
78 module_param(cmd_sg_entries, uint, 0444);
79 MODULE_PARM_DESC(cmd_sg_entries,
80 "Default number of gather/scatter entries in the SRP command (default is 12, max 255)");
81
82 module_param(indirect_sg_entries, uint, 0444);
83 MODULE_PARM_DESC(indirect_sg_entries,
84 "Default max number of gather/scatter entries (default is 12, max is " __stringify(SCSI_MAX_SG_CHAIN_SEGMENTS) ")");
85
86 module_param(allow_ext_sg, bool, 0444);
87 MODULE_PARM_DESC(allow_ext_sg,
88 "Default behavior when there are more than cmd_sg_entries S/G entries after mapping; fails the request when false (default false)");
89
90 module_param(topspin_workarounds, int, 0444);
91 MODULE_PARM_DESC(topspin_workarounds,
92 "Enable workarounds for Topspin/Cisco SRP target bugs if != 0");
93
94 module_param(prefer_fr, bool, 0444);
95 MODULE_PARM_DESC(prefer_fr,
96 "Whether to use fast registration if both FMR and fast registration are supported");
97
98 module_param(register_always, bool, 0444);
99 MODULE_PARM_DESC(register_always,
100 "Use memory registration even for contiguous memory regions");
101
102 static const struct kernel_param_ops srp_tmo_ops;
103
104 static int srp_reconnect_delay = 10;
105 module_param_cb(reconnect_delay, &srp_tmo_ops, &srp_reconnect_delay,
106 S_IRUGO | S_IWUSR);
107 MODULE_PARM_DESC(reconnect_delay, "Time between successive reconnect attempts");
108
109 static int srp_fast_io_fail_tmo = 15;
110 module_param_cb(fast_io_fail_tmo, &srp_tmo_ops, &srp_fast_io_fail_tmo,
111 S_IRUGO | S_IWUSR);
112 MODULE_PARM_DESC(fast_io_fail_tmo,
113 "Number of seconds between the observation of a transport"
114 " layer error and failing all I/O. \"off\" means that this"
115 " functionality is disabled.");
116
117 static int srp_dev_loss_tmo = 600;
118 module_param_cb(dev_loss_tmo, &srp_tmo_ops, &srp_dev_loss_tmo,
119 S_IRUGO | S_IWUSR);
120 MODULE_PARM_DESC(dev_loss_tmo,
121 "Maximum number of seconds that the SRP transport should"
122 " insulate transport layer errors. After this time has been"
123 " exceeded the SCSI host is removed. Should be"
124 " between 1 and " __stringify(SCSI_DEVICE_BLOCK_MAX_TIMEOUT)
125 " if fast_io_fail_tmo has not been set. \"off\" means that"
126 " this functionality is disabled.");
127
128 static unsigned ch_count;
129 module_param(ch_count, uint, 0444);
130 MODULE_PARM_DESC(ch_count,
131 "Number of RDMA channels to use for communication with an SRP target. Using more than one channel improves performance if the HCA supports multiple completion vectors. The default value is the minimum of four times the number of online CPU sockets and the number of completion vectors supported by the HCA.");
132
133 static void srp_add_one(struct ib_device *device);
134 static void srp_remove_one(struct ib_device *device, void *client_data);
135 static void srp_recv_completion(struct ib_cq *cq, void *ch_ptr);
136 static void srp_send_completion(struct ib_cq *cq, void *ch_ptr);
137 static int srp_cm_handler(struct ib_cm_id *cm_id, struct ib_cm_event *event);
138
139 static struct scsi_transport_template *ib_srp_transport_template;
140 static struct workqueue_struct *srp_remove_wq;
141
142 static struct ib_client srp_client = {
143 .name = "srp",
144 .add = srp_add_one,
145 .remove = srp_remove_one
146 };
147
148 static struct ib_sa_client srp_sa_client;
149
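/*
 * Show an SRP timeout module parameter; a negative stored value is
 * reported as "off".
 */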
150 static int srp_tmo_get(char *buffer, const struct kernel_param *kp)
151 {
152 int tmo = *(int *)kp->arg;
153
154 if (tmo >= 0)
155 return sprintf(buffer, "%d", tmo);
156 else
157 return sprintf(buffer, "off");
158 }
159
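/*
 * Parse and store an SRP timeout module parameter after checking it
 * against the other timeout parameters via srp_tmo_valid().
 */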
160 static int srp_tmo_set(const char *val, const struct kernel_param *kp)
161 {
162 int tmo, res;
163
164 res = srp_parse_tmo(&tmo, val);
165 if (res)
166 goto out;
167
168 if (kp->arg == &srp_reconnect_delay)
169 res = srp_tmo_valid(tmo, srp_fast_io_fail_tmo,
170 srp_dev_loss_tmo);
171 else if (kp->arg == &srp_fast_io_fail_tmo)
172 res = srp_tmo_valid(srp_reconnect_delay, tmo, srp_dev_loss_tmo);
173 else
174 res = srp_tmo_valid(srp_reconnect_delay, srp_fast_io_fail_tmo,
175 tmo);
176 if (res)
177 goto out;
178 *(int *)kp->arg = tmo;
179
180 out:
181 return res;
182 }
183
184 static const struct kernel_param_ops srp_tmo_ops = {
185 .get = srp_tmo_get,
186 .set = srp_tmo_set,
187 };
188
189 static inline struct srp_target_port *host_to_target(struct Scsi_Host *host)
190 {
191 return (struct srp_target_port *) host->hostdata;
192 }
193
194 static const char *srp_target_info(struct Scsi_Host *host)
195 {
196 return host_to_target(host)->target_name;
197 }
198
199 static int srp_target_is_topspin(struct srp_target_port *target)
200 {
201 static const u8 topspin_oui[3] = { 0x00, 0x05, 0xad };
202 static const u8 cisco_oui[3] = { 0x00, 0x1b, 0x0d };
203
204 return topspin_workarounds &&
205 (!memcmp(&target->ioc_guid, topspin_oui, sizeof topspin_oui) ||
206 !memcmp(&target->ioc_guid, cisco_oui, sizeof cisco_oui));
207 }
208
209 static struct srp_iu *srp_alloc_iu(struct srp_host *host, size_t size,
210 gfp_t gfp_mask,
211 enum dma_data_direction direction)
212 {
213 struct srp_iu *iu;
214
215 iu = kmalloc(sizeof *iu, gfp_mask);
216 if (!iu)
217 goto out;
218
219 iu->buf = kzalloc(size, gfp_mask);
220 if (!iu->buf)
221 goto out_free_iu;
222
223 iu->dma = ib_dma_map_single(host->srp_dev->dev, iu->buf, size,
224 direction);
225 if (ib_dma_mapping_error(host->srp_dev->dev, iu->dma))
226 goto out_free_buf;
227
228 iu->size = size;
229 iu->direction = direction;
230
231 return iu;
232
233 out_free_buf:
234 kfree(iu->buf);
235 out_free_iu:
236 kfree(iu);
237 out:
238 return NULL;
239 }
240
241 static void srp_free_iu(struct srp_host *host, struct srp_iu *iu)
242 {
243 if (!iu)
244 return;
245
246 ib_dma_unmap_single(host->srp_dev->dev, iu->dma, iu->size,
247 iu->direction);
248 kfree(iu->buf);
249 kfree(iu);
250 }
251
252 static void srp_qp_event(struct ib_event *event, void *context)
253 {
254 pr_debug("QP event %s (%d)\n",
255 ib_event_msg(event->event), event->event);
256 }
257
258 static int srp_init_qp(struct srp_target_port *target,
259 struct ib_qp *qp)
260 {
261 struct ib_qp_attr *attr;
262 int ret;
263
264 attr = kmalloc(sizeof *attr, GFP_KERNEL);
265 if (!attr)
266 return -ENOMEM;
267
268 ret = ib_find_cached_pkey(target->srp_host->srp_dev->dev,
269 target->srp_host->port,
270 be16_to_cpu(target->pkey),
271 &attr->pkey_index);
272 if (ret)
273 goto out;
274
275 attr->qp_state = IB_QPS_INIT;
276 attr->qp_access_flags = (IB_ACCESS_REMOTE_READ |
277 IB_ACCESS_REMOTE_WRITE);
278 attr->port_num = target->srp_host->port;
279
280 ret = ib_modify_qp(qp, attr,
281 IB_QP_STATE |
282 IB_QP_PKEY_INDEX |
283 IB_QP_ACCESS_FLAGS |
284 IB_QP_PORT);
285
286 out:
287 kfree(attr);
288 return ret;
289 }
290
291 static int srp_new_cm_id(struct srp_rdma_ch *ch)
292 {
293 struct srp_target_port *target = ch->target;
294 struct ib_cm_id *new_cm_id;
295
296 new_cm_id = ib_create_cm_id(target->srp_host->srp_dev->dev,
297 srp_cm_handler, ch);
298 if (IS_ERR(new_cm_id))
299 return PTR_ERR(new_cm_id);
300
301 if (ch->cm_id)
302 ib_destroy_cm_id(ch->cm_id);
303 ch->cm_id = new_cm_id;
304 ch->path.sgid = target->sgid;
305 ch->path.dgid = target->orig_dgid;
306 ch->path.pkey = target->pkey;
307 ch->path.service_id = target->service_id;
308
309 return 0;
310 }
311
312 static struct ib_fmr_pool *srp_alloc_fmr_pool(struct srp_target_port *target)
313 {
314 struct srp_device *dev = target->srp_host->srp_dev;
315 struct ib_fmr_pool_param fmr_param;
316
317 memset(&fmr_param, 0, sizeof(fmr_param));
318 fmr_param.pool_size = target->scsi_host->can_queue;
319 fmr_param.dirty_watermark = fmr_param.pool_size / 4;
320 fmr_param.cache = 1;
321 fmr_param.max_pages_per_fmr = dev->max_pages_per_mr;
322 fmr_param.page_shift = ilog2(dev->mr_page_size);
323 fmr_param.access = (IB_ACCESS_LOCAL_WRITE |
324 IB_ACCESS_REMOTE_WRITE |
325 IB_ACCESS_REMOTE_READ);
326
327 return ib_create_fmr_pool(dev->pd, &fmr_param);
328 }
329
330 /**
331 * srp_destroy_fr_pool() - free the resources owned by a pool
332 * @pool: Fast registration pool to be destroyed.
333 */
334 static void srp_destroy_fr_pool(struct srp_fr_pool *pool)
335 {
336 int i;
337 struct srp_fr_desc *d;
338
339 if (!pool)
340 return;
341
342 for (i = 0, d = &pool->desc[0]; i < pool->size; i++, d++) {
343 if (d->mr)
344 ib_dereg_mr(d->mr);
345 }
346 kfree(pool);
347 }
348
349 /**
350 * srp_create_fr_pool() - allocate and initialize a pool for fast registration
351 * @device: IB device to allocate fast registration descriptors for.
352 * @pd: Protection domain associated with the FR descriptors.
353 * @pool_size: Number of descriptors to allocate.
354 * @max_page_list_len: Maximum fast registration work request page list length.
355 */
356 static struct srp_fr_pool *srp_create_fr_pool(struct ib_device *device,
357 struct ib_pd *pd, int pool_size,
358 int max_page_list_len)
359 {
360 struct srp_fr_pool *pool;
361 struct srp_fr_desc *d;
362 struct ib_mr *mr;
363 int i, ret = -EINVAL;
364
365 if (pool_size <= 0)
366 goto err;
367 ret = -ENOMEM;
368 pool = kzalloc(sizeof(struct srp_fr_pool) +
369 pool_size * sizeof(struct srp_fr_desc), GFP_KERNEL);
370 if (!pool)
371 goto err;
372 pool->size = pool_size;
373 pool->max_page_list_len = max_page_list_len;
374 spin_lock_init(&pool->lock);
375 INIT_LIST_HEAD(&pool->free_list);
376
377 for (i = 0, d = &pool->desc[0]; i < pool->size; i++, d++) {
378 mr = ib_alloc_mr(pd, IB_MR_TYPE_MEM_REG,
379 max_page_list_len);
380 if (IS_ERR(mr)) {
381 ret = PTR_ERR(mr);
382 goto destroy_pool;
383 }
384 d->mr = mr;
385 list_add_tail(&d->entry, &pool->free_list);
386 }
387
388 out:
389 return pool;
390
391 destroy_pool:
392 srp_destroy_fr_pool(pool);
393
394 err:
395 pool = ERR_PTR(ret);
396 goto out;
397 }
398
399 /**
400 * srp_fr_pool_get() - obtain a descriptor suitable for fast registration
401 * @pool: Pool to obtain descriptor from.
402 */
403 static struct srp_fr_desc *srp_fr_pool_get(struct srp_fr_pool *pool)
404 {
405 struct srp_fr_desc *d = NULL;
406 unsigned long flags;
407
408 spin_lock_irqsave(&pool->lock, flags);
409 if (!list_empty(&pool->free_list)) {
410 d = list_first_entry(&pool->free_list, typeof(*d), entry);
411 list_del(&d->entry);
412 }
413 spin_unlock_irqrestore(&pool->lock, flags);
414
415 return d;
416 }
417
418 /**
419 * srp_fr_pool_put() - put an FR descriptor back in the free list
420 * @pool: Pool the descriptor was allocated from.
421 * @desc: Pointer to an array of fast registration descriptor pointers.
422 * @n: Number of descriptors to put back.
423 *
424 * Note: The caller must already have queued an invalidation request for
425 * desc->mr->rkey before calling this function.
426 */
427 static void srp_fr_pool_put(struct srp_fr_pool *pool, struct srp_fr_desc **desc,
428 int n)
429 {
430 unsigned long flags;
431 int i;
432
433 spin_lock_irqsave(&pool->lock, flags);
434 for (i = 0; i < n; i++)
435 list_add(&desc[i]->entry, &pool->free_list);
436 spin_unlock_irqrestore(&pool->lock, flags);
437 }
438
439 static struct srp_fr_pool *srp_alloc_fr_pool(struct srp_target_port *target)
440 {
441 struct srp_device *dev = target->srp_host->srp_dev;
442
443 return srp_create_fr_pool(dev->dev, dev->pd,
444 target->scsi_host->can_queue,
445 dev->max_pages_per_mr);
446 }
447
448 /**
449 * srp_destroy_qp() - destroy an RDMA queue pair
450 * @ch: SRP RDMA channel.
451 *
452 * Change a queue pair into the error state and wait until all receive
453  * completions have been processed before destroying it. This prevents
454  * the receive completion handler from accessing the queue pair while it
455  * is being destroyed.
456 */
457 static void srp_destroy_qp(struct srp_rdma_ch *ch)
458 {
459 static struct ib_qp_attr attr = { .qp_state = IB_QPS_ERR };
460 static struct ib_recv_wr wr = { .wr_id = SRP_LAST_WR_ID };
461 struct ib_recv_wr *bad_wr;
462 int ret;
463
464 /* Destroying a QP and reusing ch->done is only safe if not connected */
465 WARN_ON_ONCE(ch->connected);
466
467 ret = ib_modify_qp(ch->qp, &attr, IB_QP_STATE);
468 	WARN_ONCE(ret, "ib_modify_qp() returned %d\n", ret);
469 if (ret)
470 goto out;
471
472 init_completion(&ch->done);
473 ret = ib_post_recv(ch->qp, &wr, &bad_wr);
474 WARN_ONCE(ret, "ib_post_recv() returned %d\n", ret);
475 if (ret == 0)
476 wait_for_completion(&ch->done);
477
478 out:
479 ib_destroy_qp(ch->qp);
480 }
481
482 static int srp_create_ch_ib(struct srp_rdma_ch *ch)
483 {
484 struct srp_target_port *target = ch->target;
485 struct srp_device *dev = target->srp_host->srp_dev;
486 struct ib_qp_init_attr *init_attr;
487 struct ib_cq *recv_cq, *send_cq;
488 struct ib_qp *qp;
489 struct ib_fmr_pool *fmr_pool = NULL;
490 struct srp_fr_pool *fr_pool = NULL;
491 const int m = 1 + dev->use_fast_reg;
492 struct ib_cq_init_attr cq_attr = {};
493 int ret;
494
495 init_attr = kzalloc(sizeof *init_attr, GFP_KERNEL);
496 if (!init_attr)
497 return -ENOMEM;
498
499 /* + 1 for SRP_LAST_WR_ID */
500 cq_attr.cqe = target->queue_size + 1;
501 cq_attr.comp_vector = ch->comp_vector;
502 recv_cq = ib_create_cq(dev->dev, srp_recv_completion, NULL, ch,
503 &cq_attr);
504 if (IS_ERR(recv_cq)) {
505 ret = PTR_ERR(recv_cq);
506 goto err;
507 }
508
509 cq_attr.cqe = m * target->queue_size;
510 cq_attr.comp_vector = ch->comp_vector;
511 send_cq = ib_create_cq(dev->dev, srp_send_completion, NULL, ch,
512 &cq_attr);
513 if (IS_ERR(send_cq)) {
514 ret = PTR_ERR(send_cq);
515 goto err_recv_cq;
516 }
517
518 ib_req_notify_cq(recv_cq, IB_CQ_NEXT_COMP);
519
520 init_attr->event_handler = srp_qp_event;
521 init_attr->cap.max_send_wr = m * target->queue_size;
522 init_attr->cap.max_recv_wr = target->queue_size + 1;
523 init_attr->cap.max_recv_sge = 1;
524 init_attr->cap.max_send_sge = 1;
525 init_attr->sq_sig_type = IB_SIGNAL_REQ_WR;
526 init_attr->qp_type = IB_QPT_RC;
527 init_attr->send_cq = send_cq;
528 init_attr->recv_cq = recv_cq;
529
530 qp = ib_create_qp(dev->pd, init_attr);
531 if (IS_ERR(qp)) {
532 ret = PTR_ERR(qp);
533 goto err_send_cq;
534 }
535
536 ret = srp_init_qp(target, qp);
537 if (ret)
538 goto err_qp;
539
540 if (dev->use_fast_reg) {
541 fr_pool = srp_alloc_fr_pool(target);
542 if (IS_ERR(fr_pool)) {
543 ret = PTR_ERR(fr_pool);
544 shost_printk(KERN_WARNING, target->scsi_host, PFX
545 "FR pool allocation failed (%d)\n", ret);
546 goto err_qp;
547 }
548 } else if (dev->use_fmr) {
549 fmr_pool = srp_alloc_fmr_pool(target);
550 if (IS_ERR(fmr_pool)) {
551 ret = PTR_ERR(fmr_pool);
552 shost_printk(KERN_WARNING, target->scsi_host, PFX
553 "FMR pool allocation failed (%d)\n", ret);
554 goto err_qp;
555 }
556 }
557
558 if (ch->qp)
559 srp_destroy_qp(ch);
560 if (ch->recv_cq)
561 ib_destroy_cq(ch->recv_cq);
562 if (ch->send_cq)
563 ib_destroy_cq(ch->send_cq);
564
565 ch->qp = qp;
566 ch->recv_cq = recv_cq;
567 ch->send_cq = send_cq;
568
569 if (dev->use_fast_reg) {
570 if (ch->fr_pool)
571 srp_destroy_fr_pool(ch->fr_pool);
572 ch->fr_pool = fr_pool;
573 } else if (dev->use_fmr) {
574 if (ch->fmr_pool)
575 ib_destroy_fmr_pool(ch->fmr_pool);
576 ch->fmr_pool = fmr_pool;
577 }
578
579 kfree(init_attr);
580 return 0;
581
582 err_qp:
583 ib_destroy_qp(qp);
584
585 err_send_cq:
586 ib_destroy_cq(send_cq);
587
588 err_recv_cq:
589 ib_destroy_cq(recv_cq);
590
591 err:
592 kfree(init_attr);
593 return ret;
594 }
595
596 /*
597 * Note: this function may be called without srp_alloc_iu_bufs() having been
598 * invoked. Hence the ch->[rt]x_ring checks.
599 */
600 static void srp_free_ch_ib(struct srp_target_port *target,
601 struct srp_rdma_ch *ch)
602 {
603 struct srp_device *dev = target->srp_host->srp_dev;
604 int i;
605
606 if (!ch->target)
607 return;
608
609 if (ch->cm_id) {
610 ib_destroy_cm_id(ch->cm_id);
611 ch->cm_id = NULL;
612 }
613
614 	/* If srp_new_cm_id() succeeded but srp_create_ch_ib() failed, return. */
615 if (!ch->qp)
616 return;
617
618 if (dev->use_fast_reg) {
619 if (ch->fr_pool)
620 srp_destroy_fr_pool(ch->fr_pool);
621 } else if (dev->use_fmr) {
622 if (ch->fmr_pool)
623 ib_destroy_fmr_pool(ch->fmr_pool);
624 }
625 srp_destroy_qp(ch);
626 ib_destroy_cq(ch->send_cq);
627 ib_destroy_cq(ch->recv_cq);
628
629 /*
630 	 * Prevent the SCSI error handler from using this channel after it
631 	 * has been freed. The SCSI error handler may continue trying to
632 	 * perform recovery actions even after scsi_remove_host() has
633 	 * returned.
634 */
635 ch->target = NULL;
636
637 ch->qp = NULL;
638 ch->send_cq = ch->recv_cq = NULL;
639
640 if (ch->rx_ring) {
641 for (i = 0; i < target->queue_size; ++i)
642 srp_free_iu(target->srp_host, ch->rx_ring[i]);
643 kfree(ch->rx_ring);
644 ch->rx_ring = NULL;
645 }
646 if (ch->tx_ring) {
647 for (i = 0; i < target->queue_size; ++i)
648 srp_free_iu(target->srp_host, ch->tx_ring[i]);
649 kfree(ch->tx_ring);
650 ch->tx_ring = NULL;
651 }
652 }
653
654 static void srp_path_rec_completion(int status,
655 struct ib_sa_path_rec *pathrec,
656 void *ch_ptr)
657 {
658 struct srp_rdma_ch *ch = ch_ptr;
659 struct srp_target_port *target = ch->target;
660
661 ch->status = status;
662 if (status)
663 shost_printk(KERN_ERR, target->scsi_host,
664 PFX "Got failed path rec status %d\n", status);
665 else
666 ch->path = *pathrec;
667 complete(&ch->done);
668 }
669
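/* Issue an SA path record query for @ch and wait for it to complete. */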
670 static int srp_lookup_path(struct srp_rdma_ch *ch)
671 {
672 struct srp_target_port *target = ch->target;
673 int ret;
674
675 ch->path.numb_path = 1;
676
677 init_completion(&ch->done);
678
679 ch->path_query_id = ib_sa_path_rec_get(&srp_sa_client,
680 target->srp_host->srp_dev->dev,
681 target->srp_host->port,
682 &ch->path,
683 IB_SA_PATH_REC_SERVICE_ID |
684 IB_SA_PATH_REC_DGID |
685 IB_SA_PATH_REC_SGID |
686 IB_SA_PATH_REC_NUMB_PATH |
687 IB_SA_PATH_REC_PKEY,
688 SRP_PATH_REC_TIMEOUT_MS,
689 GFP_KERNEL,
690 srp_path_rec_completion,
691 ch, &ch->path_query);
692 if (ch->path_query_id < 0)
693 return ch->path_query_id;
694
695 ret = wait_for_completion_interruptible(&ch->done);
696 if (ret < 0)
697 return ret;
698
699 if (ch->status < 0)
700 shost_printk(KERN_WARNING, target->scsi_host,
701 PFX "Path record query failed\n");
702
703 return ch->status;
704 }
705
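/* Build an SRP_LOGIN_REQ for channel @ch and send it via the IB CM. */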
706 static int srp_send_req(struct srp_rdma_ch *ch, bool multich)
707 {
708 struct srp_target_port *target = ch->target;
709 struct {
710 struct ib_cm_req_param param;
711 struct srp_login_req priv;
712 } *req = NULL;
713 int status;
714
715 req = kzalloc(sizeof *req, GFP_KERNEL);
716 if (!req)
717 return -ENOMEM;
718
719 req->param.primary_path = &ch->path;
720 req->param.alternate_path = NULL;
721 req->param.service_id = target->service_id;
722 req->param.qp_num = ch->qp->qp_num;
723 req->param.qp_type = ch->qp->qp_type;
724 req->param.private_data = &req->priv;
725 req->param.private_data_len = sizeof req->priv;
726 req->param.flow_control = 1;
727
728 get_random_bytes(&req->param.starting_psn, 4);
729 req->param.starting_psn &= 0xffffff;
730
731 /*
732 * Pick some arbitrary defaults here; we could make these
733 * module parameters if anyone cared about setting them.
734 */
735 req->param.responder_resources = 4;
736 req->param.remote_cm_response_timeout = 20;
737 req->param.local_cm_response_timeout = 20;
738 req->param.retry_count = target->tl_retry_count;
739 req->param.rnr_retry_count = 7;
740 req->param.max_cm_retries = 15;
741
742 req->priv.opcode = SRP_LOGIN_REQ;
743 req->priv.tag = 0;
744 req->priv.req_it_iu_len = cpu_to_be32(target->max_iu_len);
745 req->priv.req_buf_fmt = cpu_to_be16(SRP_BUF_FORMAT_DIRECT |
746 SRP_BUF_FORMAT_INDIRECT);
747 req->priv.req_flags = (multich ? SRP_MULTICHAN_MULTI :
748 SRP_MULTICHAN_SINGLE);
749 /*
750 * In the published SRP specification (draft rev. 16a), the
751 * port identifier format is 8 bytes of ID extension followed
752 * by 8 bytes of GUID. Older drafts put the two halves in the
753 * opposite order, so that the GUID comes first.
754 *
755 * Targets conforming to these obsolete drafts can be
756 * recognized by the I/O Class they report.
757 */
758 if (target->io_class == SRP_REV10_IB_IO_CLASS) {
759 memcpy(req->priv.initiator_port_id,
760 &target->sgid.global.interface_id, 8);
761 memcpy(req->priv.initiator_port_id + 8,
762 &target->initiator_ext, 8);
763 memcpy(req->priv.target_port_id, &target->ioc_guid, 8);
764 memcpy(req->priv.target_port_id + 8, &target->id_ext, 8);
765 } else {
766 memcpy(req->priv.initiator_port_id,
767 &target->initiator_ext, 8);
768 memcpy(req->priv.initiator_port_id + 8,
769 &target->sgid.global.interface_id, 8);
770 memcpy(req->priv.target_port_id, &target->id_ext, 8);
771 memcpy(req->priv.target_port_id + 8, &target->ioc_guid, 8);
772 }
773
774 /*
775 * Topspin/Cisco SRP targets will reject our login unless we
776 * zero out the first 8 bytes of our initiator port ID and set
777 * the second 8 bytes to the local node GUID.
778 */
779 if (srp_target_is_topspin(target)) {
780 shost_printk(KERN_DEBUG, target->scsi_host,
781 PFX "Topspin/Cisco initiator port ID workaround "
782 "activated for target GUID %016llx\n",
783 be64_to_cpu(target->ioc_guid));
784 memset(req->priv.initiator_port_id, 0, 8);
785 memcpy(req->priv.initiator_port_id + 8,
786 &target->srp_host->srp_dev->dev->node_guid, 8);
787 }
788
789 status = ib_send_cm_req(ch->cm_id, &req->param);
790
791 kfree(req);
792
793 return status;
794 }
795
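/*
 * Transition @target to the SRP_TARGET_REMOVED state and queue its removal
 * work. Returns false if removal had already been queued.
 */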
796 static bool srp_queue_remove_work(struct srp_target_port *target)
797 {
798 bool changed = false;
799
800 spin_lock_irq(&target->lock);
801 if (target->state != SRP_TARGET_REMOVED) {
802 target->state = SRP_TARGET_REMOVED;
803 changed = true;
804 }
805 spin_unlock_irq(&target->lock);
806
807 if (changed)
808 queue_work(srp_remove_wq, &target->remove_work);
809
810 return changed;
811 }
812
813 static void srp_disconnect_target(struct srp_target_port *target)
814 {
815 struct srp_rdma_ch *ch;
816 int i;
817
818 /* XXX should send SRP_I_LOGOUT request */
819
820 for (i = 0; i < target->ch_count; i++) {
821 ch = &target->ch[i];
822 ch->connected = false;
823 if (ch->cm_id && ib_send_cm_dreq(ch->cm_id, NULL, 0)) {
824 shost_printk(KERN_DEBUG, target->scsi_host,
825 PFX "Sending CM DREQ failed\n");
826 }
827 }
828 }
829
830 static void srp_free_req_data(struct srp_target_port *target,
831 struct srp_rdma_ch *ch)
832 {
833 struct srp_device *dev = target->srp_host->srp_dev;
834 struct ib_device *ibdev = dev->dev;
835 struct srp_request *req;
836 int i;
837
838 if (!ch->req_ring)
839 return;
840
841 for (i = 0; i < target->req_ring_size; ++i) {
842 req = &ch->req_ring[i];
843 if (dev->use_fast_reg) {
844 kfree(req->fr_list);
845 } else {
846 kfree(req->fmr_list);
847 kfree(req->map_page);
848 }
849 if (req->indirect_dma_addr) {
850 ib_dma_unmap_single(ibdev, req->indirect_dma_addr,
851 target->indirect_size,
852 DMA_TO_DEVICE);
853 }
854 kfree(req->indirect_desc);
855 }
856
857 kfree(ch->req_ring);
858 ch->req_ring = NULL;
859 }
860
861 static int srp_alloc_req_data(struct srp_rdma_ch *ch)
862 {
863 struct srp_target_port *target = ch->target;
864 struct srp_device *srp_dev = target->srp_host->srp_dev;
865 struct ib_device *ibdev = srp_dev->dev;
866 struct srp_request *req;
867 void *mr_list;
868 dma_addr_t dma_addr;
869 int i, ret = -ENOMEM;
870
871 ch->req_ring = kcalloc(target->req_ring_size, sizeof(*ch->req_ring),
872 GFP_KERNEL);
873 if (!ch->req_ring)
874 goto out;
875
876 for (i = 0; i < target->req_ring_size; ++i) {
877 req = &ch->req_ring[i];
878 mr_list = kmalloc(target->cmd_sg_cnt * sizeof(void *),
879 GFP_KERNEL);
880 if (!mr_list)
881 goto out;
882 if (srp_dev->use_fast_reg) {
883 req->fr_list = mr_list;
884 } else {
885 req->fmr_list = mr_list;
886 req->map_page = kmalloc(srp_dev->max_pages_per_mr *
887 sizeof(void *), GFP_KERNEL);
888 if (!req->map_page)
889 goto out;
890 }
891 req->indirect_desc = kmalloc(target->indirect_size, GFP_KERNEL);
892 if (!req->indirect_desc)
893 goto out;
894
895 dma_addr = ib_dma_map_single(ibdev, req->indirect_desc,
896 target->indirect_size,
897 DMA_TO_DEVICE);
898 if (ib_dma_mapping_error(ibdev, dma_addr))
899 goto out;
900
901 req->indirect_dma_addr = dma_addr;
902 }
903 ret = 0;
904
905 out:
906 return ret;
907 }
908
909 /**
910 * srp_del_scsi_host_attr() - Remove attributes defined in the host template.
911 * @shost: SCSI host whose attributes to remove from sysfs.
912 *
913  * Note: Any attributes defined in the host template that did not exist
914  * before this function was invoked will be ignored.
915 */
916 static void srp_del_scsi_host_attr(struct Scsi_Host *shost)
917 {
918 struct device_attribute **attr;
919
920 for (attr = shost->hostt->shost_attrs; attr && *attr; ++attr)
921 device_remove_file(&shost->shost_dev, *attr);
922 }
923
924 static void srp_remove_target(struct srp_target_port *target)
925 {
926 struct srp_rdma_ch *ch;
927 int i;
928
929 WARN_ON_ONCE(target->state != SRP_TARGET_REMOVED);
930
931 srp_del_scsi_host_attr(target->scsi_host);
932 srp_rport_get(target->rport);
933 srp_remove_host(target->scsi_host);
934 scsi_remove_host(target->scsi_host);
935 srp_stop_rport_timers(target->rport);
936 srp_disconnect_target(target);
937 for (i = 0; i < target->ch_count; i++) {
938 ch = &target->ch[i];
939 srp_free_ch_ib(target, ch);
940 }
941 cancel_work_sync(&target->tl_err_work);
942 srp_rport_put(target->rport);
943 for (i = 0; i < target->ch_count; i++) {
944 ch = &target->ch[i];
945 srp_free_req_data(target, ch);
946 }
947 kfree(target->ch);
948 target->ch = NULL;
949
950 spin_lock(&target->srp_host->target_lock);
951 list_del(&target->list);
952 spin_unlock(&target->srp_host->target_lock);
953
954 scsi_host_put(target->scsi_host);
955 }
956
957 static void srp_remove_work(struct work_struct *work)
958 {
959 struct srp_target_port *target =
960 container_of(work, struct srp_target_port, remove_work);
961
962 WARN_ON_ONCE(target->state != SRP_TARGET_REMOVED);
963
964 srp_remove_target(target);
965 }
966
967 static void srp_rport_delete(struct srp_rport *rport)
968 {
969 struct srp_target_port *target = rport->lld_data;
970
971 srp_queue_remove_work(target);
972 }
973
974 /**
975 * srp_connected_ch() - number of connected channels
976 * @target: SRP target port.
977 */
978 static int srp_connected_ch(struct srp_target_port *target)
979 {
980 int i, c = 0;
981
982 for (i = 0; i < target->ch_count; i++)
983 c += target->ch[i].connected;
984
985 return c;
986 }
987
988 static int srp_connect_ch(struct srp_rdma_ch *ch, bool multich)
989 {
990 struct srp_target_port *target = ch->target;
991 int ret;
992
993 WARN_ON_ONCE(!multich && srp_connected_ch(target) > 0);
994
995 ret = srp_lookup_path(ch);
996 if (ret)
997 return ret;
998
999 while (1) {
1000 init_completion(&ch->done);
1001 ret = srp_send_req(ch, multich);
1002 if (ret)
1003 return ret;
1004 ret = wait_for_completion_interruptible(&ch->done);
1005 if (ret < 0)
1006 return ret;
1007
1008 /*
1009 * The CM event handling code will set status to
1010 * SRP_PORT_REDIRECT if we get a port redirect REJ
1011 * back, or SRP_DLID_REDIRECT if we get a lid/qp
1012 * redirect REJ back.
1013 */
1014 switch (ch->status) {
1015 case 0:
1016 ch->connected = true;
1017 return 0;
1018
1019 case SRP_PORT_REDIRECT:
1020 ret = srp_lookup_path(ch);
1021 if (ret)
1022 return ret;
1023 break;
1024
1025 case SRP_DLID_REDIRECT:
1026 break;
1027
1028 case SRP_STALE_CONN:
1029 shost_printk(KERN_ERR, target->scsi_host, PFX
1030 "giving up on stale connection\n");
1031 ch->status = -ECONNRESET;
1032 return ch->status;
1033
1034 default:
1035 return ch->status;
1036 }
1037 }
1038 }
1039
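/* Post a local invalidation work request for @rkey on the QP of @ch. */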
1040 static int srp_inv_rkey(struct srp_rdma_ch *ch, u32 rkey)
1041 {
1042 struct ib_send_wr *bad_wr;
1043 struct ib_send_wr wr = {
1044 .opcode = IB_WR_LOCAL_INV,
1045 .wr_id = LOCAL_INV_WR_ID_MASK,
1046 .next = NULL,
1047 .num_sge = 0,
1048 .send_flags = 0,
1049 .ex.invalidate_rkey = rkey,
1050 };
1051
1052 return ib_post_send(ch->qp, &wr, &bad_wr);
1053 }
1054
1055 static void srp_unmap_data(struct scsi_cmnd *scmnd,
1056 struct srp_rdma_ch *ch,
1057 struct srp_request *req)
1058 {
1059 struct srp_target_port *target = ch->target;
1060 struct srp_device *dev = target->srp_host->srp_dev;
1061 struct ib_device *ibdev = dev->dev;
1062 int i, res;
1063
1064 if (!scsi_sglist(scmnd) ||
1065 (scmnd->sc_data_direction != DMA_TO_DEVICE &&
1066 scmnd->sc_data_direction != DMA_FROM_DEVICE))
1067 return;
1068
1069 if (dev->use_fast_reg) {
1070 struct srp_fr_desc **pfr;
1071
1072 for (i = req->nmdesc, pfr = req->fr_list; i > 0; i--, pfr++) {
1073 res = srp_inv_rkey(ch, (*pfr)->mr->rkey);
1074 if (res < 0) {
1075 shost_printk(KERN_ERR, target->scsi_host, PFX
1076 "Queueing INV WR for rkey %#x failed (%d)\n",
1077 (*pfr)->mr->rkey, res);
1078 queue_work(system_long_wq,
1079 &target->tl_err_work);
1080 }
1081 }
1082 if (req->nmdesc)
1083 srp_fr_pool_put(ch->fr_pool, req->fr_list,
1084 req->nmdesc);
1085 } else if (dev->use_fmr) {
1086 struct ib_pool_fmr **pfmr;
1087
1088 for (i = req->nmdesc, pfmr = req->fmr_list; i > 0; i--, pfmr++)
1089 ib_fmr_pool_unmap(*pfmr);
1090 }
1091
1092 ib_dma_unmap_sg(ibdev, scsi_sglist(scmnd), scsi_sg_count(scmnd),
1093 scmnd->sc_data_direction);
1094 }
1095
1096 /**
1097  * srp_claim_req() - Take ownership of the scmnd associated with a request.
1098 * @ch: SRP RDMA channel.
1099 * @req: SRP request.
1100 * @sdev: If not NULL, only take ownership for this SCSI device.
1101 * @scmnd: If NULL, take ownership of @req->scmnd. If not NULL, only take
1102 * ownership of @req->scmnd if it equals @scmnd.
1103 *
1104 * Return value:
1105 * Either NULL or a pointer to the SCSI command the caller became owner of.
1106 */
1107 static struct scsi_cmnd *srp_claim_req(struct srp_rdma_ch *ch,
1108 struct srp_request *req,
1109 struct scsi_device *sdev,
1110 struct scsi_cmnd *scmnd)
1111 {
1112 unsigned long flags;
1113
1114 spin_lock_irqsave(&ch->lock, flags);
1115 if (req->scmnd &&
1116 (!sdev || req->scmnd->device == sdev) &&
1117 (!scmnd || req->scmnd == scmnd)) {
1118 scmnd = req->scmnd;
1119 req->scmnd = NULL;
1120 } else {
1121 scmnd = NULL;
1122 }
1123 spin_unlock_irqrestore(&ch->lock, flags);
1124
1125 return scmnd;
1126 }
1127
1128 /**
1129 * srp_free_req() - Unmap data and add request to the free request list.
1130 * @ch: SRP RDMA channel.
1131 * @req: Request to be freed.
1132 * @scmnd: SCSI command associated with @req.
1133 * @req_lim_delta: Amount to be added to @target->req_lim.
1134 */
1135 static void srp_free_req(struct srp_rdma_ch *ch, struct srp_request *req,
1136 struct scsi_cmnd *scmnd, s32 req_lim_delta)
1137 {
1138 unsigned long flags;
1139
1140 srp_unmap_data(scmnd, ch, req);
1141
1142 spin_lock_irqsave(&ch->lock, flags);
1143 ch->req_lim += req_lim_delta;
1144 spin_unlock_irqrestore(&ch->lock, flags);
1145 }
1146
1147 static void srp_finish_req(struct srp_rdma_ch *ch, struct srp_request *req,
1148 struct scsi_device *sdev, int result)
1149 {
1150 struct scsi_cmnd *scmnd = srp_claim_req(ch, req, sdev, NULL);
1151
1152 if (scmnd) {
1153 srp_free_req(ch, req, scmnd, 0);
1154 scmnd->result = result;
1155 scmnd->scsi_done(scmnd);
1156 }
1157 }
1158
1159 static void srp_terminate_io(struct srp_rport *rport)
1160 {
1161 struct srp_target_port *target = rport->lld_data;
1162 struct srp_rdma_ch *ch;
1163 struct Scsi_Host *shost = target->scsi_host;
1164 struct scsi_device *sdev;
1165 int i, j;
1166
1167 /*
1168 * Invoking srp_terminate_io() while srp_queuecommand() is running
1169 * is not safe. Hence the warning statement below.
1170 */
1171 shost_for_each_device(sdev, shost)
1172 WARN_ON_ONCE(sdev->request_queue->request_fn_active);
1173
1174 for (i = 0; i < target->ch_count; i++) {
1175 ch = &target->ch[i];
1176
1177 for (j = 0; j < target->req_ring_size; ++j) {
1178 struct srp_request *req = &ch->req_ring[j];
1179
1180 srp_finish_req(ch, req, NULL,
1181 DID_TRANSPORT_FAILFAST << 16);
1182 }
1183 }
1184 }
1185
1186 /*
1187 * It is up to the caller to ensure that srp_rport_reconnect() calls are
1188 * serialized and that no concurrent srp_queuecommand(), srp_abort(),
1189 * srp_reset_device() or srp_reset_host() calls will occur while this function
1190  * is in progress. One way to achieve that is not to call this function
1191  * directly but to call srp_reconnect_rport() instead, since that function
1192 * serializes calls of this function via rport->mutex and also blocks
1193 * srp_queuecommand() calls before invoking this function.
1194 */
1195 static int srp_rport_reconnect(struct srp_rport *rport)
1196 {
1197 struct srp_target_port *target = rport->lld_data;
1198 struct srp_rdma_ch *ch;
1199 int i, j, ret = 0;
1200 bool multich = false;
1201
1202 srp_disconnect_target(target);
1203
1204 if (target->state == SRP_TARGET_SCANNING)
1205 return -ENODEV;
1206
1207 /*
1208 * Now get a new local CM ID so that we avoid confusing the target in
1209 * case things are really fouled up. Doing so also ensures that all CM
1210 * callbacks will have finished before a new QP is allocated.
1211 */
1212 for (i = 0; i < target->ch_count; i++) {
1213 ch = &target->ch[i];
1214 ret += srp_new_cm_id(ch);
1215 }
1216 for (i = 0; i < target->ch_count; i++) {
1217 ch = &target->ch[i];
1218 for (j = 0; j < target->req_ring_size; ++j) {
1219 struct srp_request *req = &ch->req_ring[j];
1220
1221 srp_finish_req(ch, req, NULL, DID_RESET << 16);
1222 }
1223 }
1224 for (i = 0; i < target->ch_count; i++) {
1225 ch = &target->ch[i];
1226 /*
1227 * Whether or not creating a new CM ID succeeded, create a new
1228 * QP. This guarantees that all completion callback function
1229 * invocations have finished before request resetting starts.
1230 */
1231 ret += srp_create_ch_ib(ch);
1232
1233 INIT_LIST_HEAD(&ch->free_tx);
1234 for (j = 0; j < target->queue_size; ++j)
1235 list_add(&ch->tx_ring[j]->list, &ch->free_tx);
1236 }
1237
1238 target->qp_in_error = false;
1239
1240 for (i = 0; i < target->ch_count; i++) {
1241 ch = &target->ch[i];
1242 if (ret)
1243 break;
1244 ret = srp_connect_ch(ch, multich);
1245 multich = true;
1246 }
1247
1248 if (ret == 0)
1249 shost_printk(KERN_INFO, target->scsi_host,
1250 PFX "reconnect succeeded\n");
1251
1252 return ret;
1253 }
1254
1255 static void srp_map_desc(struct srp_map_state *state, dma_addr_t dma_addr,
1256 unsigned int dma_len, u32 rkey)
1257 {
1258 struct srp_direct_buf *desc = state->desc;
1259
1260 WARN_ON_ONCE(!dma_len);
1261
1262 desc->va = cpu_to_be64(dma_addr);
1263 desc->key = cpu_to_be32(rkey);
1264 desc->len = cpu_to_be32(dma_len);
1265
1266 state->total_len += dma_len;
1267 state->desc++;
1268 state->ndesc++;
1269 }
1270
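/*
 * Map the pages gathered in @state and append a memory descriptor for the
 * result. The FMR pool of @ch is used unless a single page can be described
 * through the global memory region.
 */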
1271 static int srp_map_finish_fmr(struct srp_map_state *state,
1272 struct srp_rdma_ch *ch)
1273 {
1274 struct srp_target_port *target = ch->target;
1275 struct srp_device *dev = target->srp_host->srp_dev;
1276 struct ib_pool_fmr *fmr;
1277 u64 io_addr = 0;
1278
1279 if (state->fmr.next >= state->fmr.end)
1280 return -ENOMEM;
1281
1282 WARN_ON_ONCE(!dev->use_fmr);
1283
1284 if (state->npages == 0)
1285 return 0;
1286
1287 if (state->npages == 1 && target->global_mr) {
1288 srp_map_desc(state, state->base_dma_addr, state->dma_len,
1289 target->global_mr->rkey);
1290 goto reset_state;
1291 }
1292
1293 fmr = ib_fmr_pool_map_phys(ch->fmr_pool, state->pages,
1294 state->npages, io_addr);
1295 if (IS_ERR(fmr))
1296 return PTR_ERR(fmr);
1297
1298 *state->fmr.next++ = fmr;
1299 state->nmdesc++;
1300
1301 srp_map_desc(state, state->base_dma_addr & ~dev->mr_page_mask,
1302 state->dma_len, fmr->fmr->rkey);
1303
1304 reset_state:
1305 state->npages = 0;
1306 state->dma_len = 0;
1307
1308 return 0;
1309 }
1310
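/*
 * Register the S/G entries gathered in @state through a fast registration
 * work request and append a memory descriptor for the registered region.
 */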
1311 static int srp_map_finish_fr(struct srp_map_state *state,
1312 struct srp_rdma_ch *ch)
1313 {
1314 struct srp_target_port *target = ch->target;
1315 struct srp_device *dev = target->srp_host->srp_dev;
1316 struct ib_send_wr *bad_wr;
1317 struct ib_reg_wr wr;
1318 struct srp_fr_desc *desc;
1319 u32 rkey;
1320 int n, err;
1321
1322 if (state->fr.next >= state->fr.end)
1323 return -ENOMEM;
1324
1325 WARN_ON_ONCE(!dev->use_fast_reg);
1326
1327 if (state->sg_nents == 0)
1328 return 0;
1329
1330 if (state->sg_nents == 1 && target->global_mr) {
1331 srp_map_desc(state, sg_dma_address(state->sg),
1332 sg_dma_len(state->sg),
1333 target->global_mr->rkey);
1334 return 1;
1335 }
1336
1337 desc = srp_fr_pool_get(ch->fr_pool);
1338 if (!desc)
1339 return -ENOMEM;
1340
1341 rkey = ib_inc_rkey(desc->mr->rkey);
1342 ib_update_fast_reg_key(desc->mr, rkey);
1343
1344 n = ib_map_mr_sg(desc->mr, state->sg, state->sg_nents,
1345 dev->mr_page_size);
1346 if (unlikely(n < 0))
1347 return n;
1348
1349 wr.wr.next = NULL;
1350 wr.wr.opcode = IB_WR_REG_MR;
1351 wr.wr.wr_id = FAST_REG_WR_ID_MASK;
1352 wr.wr.num_sge = 0;
1353 wr.wr.send_flags = 0;
1354 wr.mr = desc->mr;
1355 wr.key = desc->mr->rkey;
1356 wr.access = (IB_ACCESS_LOCAL_WRITE |
1357 IB_ACCESS_REMOTE_READ |
1358 IB_ACCESS_REMOTE_WRITE);
1359
1360 *state->fr.next++ = desc;
1361 state->nmdesc++;
1362
1363 srp_map_desc(state, desc->mr->iova,
1364 desc->mr->length, desc->mr->rkey);
1365
1366 err = ib_post_send(ch->qp, &wr.wr, &bad_wr);
1367 if (unlikely(err))
1368 return err;
1369
1370 return n;
1371 }
1372
1373 static int srp_map_sg_entry(struct srp_map_state *state,
1374 struct srp_rdma_ch *ch,
1375 struct scatterlist *sg, int sg_index)
1376 {
1377 struct srp_target_port *target = ch->target;
1378 struct srp_device *dev = target->srp_host->srp_dev;
1379 struct ib_device *ibdev = dev->dev;
1380 dma_addr_t dma_addr = ib_sg_dma_address(ibdev, sg);
1381 unsigned int dma_len = ib_sg_dma_len(ibdev, sg);
1382 unsigned int len = 0;
1383 int ret;
1384
1385 WARN_ON_ONCE(!dma_len);
1386
1387 while (dma_len) {
1388 unsigned offset = dma_addr & ~dev->mr_page_mask;
1389 if (state->npages == dev->max_pages_per_mr || offset != 0) {
1390 ret = srp_map_finish_fmr(state, ch);
1391 if (ret)
1392 return ret;
1393 }
1394
1395 len = min_t(unsigned int, dma_len, dev->mr_page_size - offset);
1396
1397 if (!state->npages)
1398 state->base_dma_addr = dma_addr;
1399 state->pages[state->npages++] = dma_addr & dev->mr_page_mask;
1400 state->dma_len += len;
1401 dma_addr += len;
1402 dma_len -= len;
1403 }
1404
1405 /*
1406 * If the last entry of the MR wasn't a full page, then we need to
1407 * close it out and start a new one -- we can only merge at page
1408 	 * boundaries.
1409 */
1410 ret = 0;
1411 if (len != dev->mr_page_size)
1412 ret = srp_map_finish_fmr(state, ch);
1413 return ret;
1414 }
1415
1416 static int srp_map_sg_fmr(struct srp_map_state *state, struct srp_rdma_ch *ch,
1417 struct srp_request *req, struct scatterlist *scat,
1418 int count)
1419 {
1420 struct scatterlist *sg;
1421 int i, ret;
1422
1423 state->desc = req->indirect_desc;
1424 state->pages = req->map_page;
1425 state->fmr.next = req->fmr_list;
1426 state->fmr.end = req->fmr_list + ch->target->cmd_sg_cnt;
1427
1428 for_each_sg(scat, sg, count, i) {
1429 ret = srp_map_sg_entry(state, ch, sg, i);
1430 if (ret)
1431 return ret;
1432 }
1433
1434 ret = srp_map_finish_fmr(state, ch);
1435 if (ret)
1436 return ret;
1437
1438 req->nmdesc = state->nmdesc;
1439
1440 return 0;
1441 }
1442
1443 static int srp_map_sg_fr(struct srp_map_state *state, struct srp_rdma_ch *ch,
1444 struct srp_request *req, struct scatterlist *scat,
1445 int count)
1446 {
1447 state->desc = req->indirect_desc;
1448 state->fr.next = req->fr_list;
1449 state->fr.end = req->fr_list + ch->target->cmd_sg_cnt;
1450 state->sg = scat;
1451 state->sg_nents = scsi_sg_count(req->scmnd);
1452
1453 while (state->sg_nents) {
1454 int i, n;
1455
1456 n = srp_map_finish_fr(state, ch);
1457 if (unlikely(n < 0))
1458 return n;
1459
1460 state->sg_nents -= n;
1461 for (i = 0; i < n; i++)
1462 state->sg = sg_next(state->sg);
1463 }
1464
1465 req->nmdesc = state->nmdesc;
1466
1467 return 0;
1468 }
1469
1470 static int srp_map_sg_dma(struct srp_map_state *state, struct srp_rdma_ch *ch,
1471 struct srp_request *req, struct scatterlist *scat,
1472 int count)
1473 {
1474 struct srp_target_port *target = ch->target;
1475 struct srp_device *dev = target->srp_host->srp_dev;
1476 struct scatterlist *sg;
1477 int i;
1478
1479 state->desc = req->indirect_desc;
1480 for_each_sg(scat, sg, count, i) {
1481 srp_map_desc(state, ib_sg_dma_address(dev->dev, sg),
1482 ib_sg_dma_len(dev->dev, sg),
1483 target->global_mr->rkey);
1484 }
1485
1486 req->nmdesc = state->nmdesc;
1487
1488 return 0;
1489 }
1490
1491 /*
1492 * Register the indirect data buffer descriptor with the HCA.
1493 *
1494 * Note: since the indirect data buffer descriptor has been allocated with
1495 * kmalloc() it is guaranteed that this buffer is a physically contiguous
1496 * memory buffer.
1497 */
1498 static int srp_map_idb(struct srp_rdma_ch *ch, struct srp_request *req,
1499 void **next_mr, void **end_mr, u32 idb_len,
1500 __be32 *idb_rkey)
1501 {
1502 struct srp_target_port *target = ch->target;
1503 struct srp_device *dev = target->srp_host->srp_dev;
1504 struct srp_map_state state;
1505 struct srp_direct_buf idb_desc;
1506 u64 idb_pages[1];
1507 struct scatterlist idb_sg[1];
1508 int ret;
1509
1510 memset(&state, 0, sizeof(state));
1511 memset(&idb_desc, 0, sizeof(idb_desc));
1512 state.gen.next = next_mr;
1513 state.gen.end = end_mr;
1514 state.desc = &idb_desc;
1515 state.base_dma_addr = req->indirect_dma_addr;
1516 state.dma_len = idb_len;
1517
1518 if (dev->use_fast_reg) {
1519 state.sg = idb_sg;
1520 state.sg_nents = 1;
1521 sg_set_buf(idb_sg, req->indirect_desc, idb_len);
1522 idb_sg->dma_address = req->indirect_dma_addr; /* hack! */
1523 ret = srp_map_finish_fr(&state, ch);
1524 if (ret < 0)
1525 return ret;
1526 } else if (dev->use_fmr) {
1527 state.pages = idb_pages;
1528 state.pages[0] = (req->indirect_dma_addr &
1529 dev->mr_page_mask);
1530 state.npages = 1;
1531 ret = srp_map_finish_fmr(&state, ch);
1532 if (ret < 0)
1533 return ret;
1534 } else {
1535 return -EINVAL;
1536 }
1537
1538 *idb_rkey = idb_desc.key;
1539
1540 return 0;
1541 }
1542
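/*
 * Build the SRP data buffer descriptors for @scmnd. Returns the payload
 * length of the SRP_CMD information unit on success or a negative error
 * code on failure.
 */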
1543 static int srp_map_data(struct scsi_cmnd *scmnd, struct srp_rdma_ch *ch,
1544 struct srp_request *req)
1545 {
1546 struct srp_target_port *target = ch->target;
1547 struct scatterlist *scat;
1548 struct srp_cmd *cmd = req->cmd->buf;
1549 int len, nents, count, ret;
1550 struct srp_device *dev;
1551 struct ib_device *ibdev;
1552 struct srp_map_state state;
1553 struct srp_indirect_buf *indirect_hdr;
1554 u32 idb_len, table_len;
1555 __be32 idb_rkey;
1556 u8 fmt;
1557
1558 if (!scsi_sglist(scmnd) || scmnd->sc_data_direction == DMA_NONE)
1559 return sizeof (struct srp_cmd);
1560
1561 if (scmnd->sc_data_direction != DMA_FROM_DEVICE &&
1562 scmnd->sc_data_direction != DMA_TO_DEVICE) {
1563 shost_printk(KERN_WARNING, target->scsi_host,
1564 PFX "Unhandled data direction %d\n",
1565 scmnd->sc_data_direction);
1566 return -EINVAL;
1567 }
1568
1569 nents = scsi_sg_count(scmnd);
1570 scat = scsi_sglist(scmnd);
1571
1572 dev = target->srp_host->srp_dev;
1573 ibdev = dev->dev;
1574
1575 count = ib_dma_map_sg(ibdev, scat, nents, scmnd->sc_data_direction);
1576 if (unlikely(count == 0))
1577 return -EIO;
1578
1579 fmt = SRP_DATA_DESC_DIRECT;
1580 len = sizeof (struct srp_cmd) + sizeof (struct srp_direct_buf);
1581
1582 if (count == 1 && target->global_mr) {
1583 /*
1584 * The midlayer only generated a single gather/scatter
1585 * entry, or DMA mapping coalesced everything to a
1586 * single entry. So a direct descriptor along with
1587 * the DMA MR suffices.
1588 */
1589 struct srp_direct_buf *buf = (void *) cmd->add_data;
1590
1591 buf->va = cpu_to_be64(ib_sg_dma_address(ibdev, scat));
1592 buf->key = cpu_to_be32(target->global_mr->rkey);
1593 buf->len = cpu_to_be32(ib_sg_dma_len(ibdev, scat));
1594
1595 req->nmdesc = 0;
1596 goto map_complete;
1597 }
1598
1599 /*
1600 * We have more than one scatter/gather entry, so build our indirect
1601 * descriptor table, trying to merge as many entries as we can.
1602 */
1603 indirect_hdr = (void *) cmd->add_data;
1604
1605 ib_dma_sync_single_for_cpu(ibdev, req->indirect_dma_addr,
1606 target->indirect_size, DMA_TO_DEVICE);
1607
1608 memset(&state, 0, sizeof(state));
1609 if (dev->use_fast_reg)
1610 srp_map_sg_fr(&state, ch, req, scat, count);
1611 else if (dev->use_fmr)
1612 srp_map_sg_fmr(&state, ch, req, scat, count);
1613 else
1614 srp_map_sg_dma(&state, ch, req, scat, count);
1615
1616 /* We've mapped the request, now pull as much of the indirect
1617 * descriptor table as we can into the command buffer. If this
1618 * target is not using an external indirect table, we are
1619 * guaranteed to fit into the command, as the SCSI layer won't
1620 * give us more S/G entries than we allow.
1621 */
1622 if (state.ndesc == 1) {
1623 /*
1624 * Memory registration collapsed the sg-list into one entry,
1625 * so use a direct descriptor.
1626 */
1627 struct srp_direct_buf *buf = (void *) cmd->add_data;
1628
1629 *buf = req->indirect_desc[0];
1630 goto map_complete;
1631 }
1632
1633 if (unlikely(target->cmd_sg_cnt < state.ndesc &&
1634 !target->allow_ext_sg)) {
1635 shost_printk(KERN_ERR, target->scsi_host,
1636 "Could not fit S/G list into SRP_CMD\n");
1637 return -EIO;
1638 }
1639
1640 count = min(state.ndesc, target->cmd_sg_cnt);
1641 table_len = state.ndesc * sizeof (struct srp_direct_buf);
1642 idb_len = sizeof(struct srp_indirect_buf) + table_len;
1643
1644 fmt = SRP_DATA_DESC_INDIRECT;
1645 len = sizeof(struct srp_cmd) + sizeof (struct srp_indirect_buf);
1646 len += count * sizeof (struct srp_direct_buf);
1647
1648 memcpy(indirect_hdr->desc_list, req->indirect_desc,
1649 count * sizeof (struct srp_direct_buf));
1650
1651 if (!target->global_mr) {
1652 ret = srp_map_idb(ch, req, state.gen.next, state.gen.end,
1653 idb_len, &idb_rkey);
1654 if (ret < 0)
1655 return ret;
1656 req->nmdesc++;
1657 } else {
1658 idb_rkey = target->global_mr->rkey;
1659 }
1660
1661 indirect_hdr->table_desc.va = cpu_to_be64(req->indirect_dma_addr);
1662 indirect_hdr->table_desc.key = idb_rkey;
1663 indirect_hdr->table_desc.len = cpu_to_be32(table_len);
1664 indirect_hdr->len = cpu_to_be32(state.total_len);
1665
1666 if (scmnd->sc_data_direction == DMA_TO_DEVICE)
1667 cmd->data_out_desc_cnt = count;
1668 else
1669 cmd->data_in_desc_cnt = count;
1670
1671 ib_dma_sync_single_for_device(ibdev, req->indirect_dma_addr, table_len,
1672 DMA_TO_DEVICE);
1673
1674 map_complete:
1675 if (scmnd->sc_data_direction == DMA_TO_DEVICE)
1676 cmd->buf_fmt = fmt << 4;
1677 else
1678 cmd->buf_fmt = fmt;
1679
1680 return len;
1681 }
1682
1683 /*
1684 * Return an IU and possible credit to the free pool
1685 */
1686 static void srp_put_tx_iu(struct srp_rdma_ch *ch, struct srp_iu *iu,
1687 enum srp_iu_type iu_type)
1688 {
1689 unsigned long flags;
1690
1691 spin_lock_irqsave(&ch->lock, flags);
1692 list_add(&iu->list, &ch->free_tx);
1693 if (iu_type != SRP_IU_RSP)
1694 ++ch->req_lim;
1695 spin_unlock_irqrestore(&ch->lock, flags);
1696 }
1697
1698 /*
1699 * Must be called with ch->lock held to protect req_lim and free_tx.
1700 * If IU is not sent, it must be returned using srp_put_tx_iu().
1701 *
1702 * Note:
1703 * An upper limit for the number of allocated information units for each
1704 * request type is:
1705 * - SRP_IU_CMD: SRP_CMD_SQ_SIZE, since the SCSI mid-layer never queues
1706 * more than Scsi_Host.can_queue requests.
1707 * - SRP_IU_TSK_MGMT: SRP_TSK_MGMT_SQ_SIZE.
1708 * - SRP_IU_RSP: 1, since a conforming SRP target never sends more than
1709 * one unanswered SRP request to an initiator.
1710 */
1711 static struct srp_iu *__srp_get_tx_iu(struct srp_rdma_ch *ch,
1712 enum srp_iu_type iu_type)
1713 {
1714 struct srp_target_port *target = ch->target;
1715 s32 rsv = (iu_type == SRP_IU_TSK_MGMT) ? 0 : SRP_TSK_MGMT_SQ_SIZE;
1716 struct srp_iu *iu;
1717
1718 srp_send_completion(ch->send_cq, ch);
1719
1720 if (list_empty(&ch->free_tx))
1721 return NULL;
1722
1723 /* Initiator responses to target requests do not consume credits */
1724 if (iu_type != SRP_IU_RSP) {
1725 if (ch->req_lim <= rsv) {
1726 ++target->zero_req_lim;
1727 return NULL;
1728 }
1729
1730 --ch->req_lim;
1731 }
1732
1733 iu = list_first_entry(&ch->free_tx, struct srp_iu, list);
1734 list_del(&iu->list);
1735 return iu;
1736 }
1737
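/* Post @iu as a signaled send work request of @len bytes on the QP of @ch. */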
1738 static int srp_post_send(struct srp_rdma_ch *ch, struct srp_iu *iu, int len)
1739 {
1740 struct srp_target_port *target = ch->target;
1741 struct ib_sge list;
1742 struct ib_send_wr wr, *bad_wr;
1743
1744 list.addr = iu->dma;
1745 list.length = len;
1746 list.lkey = target->lkey;
1747
1748 wr.next = NULL;
1749 wr.wr_id = (uintptr_t) iu;
1750 wr.sg_list = &list;
1751 wr.num_sge = 1;
1752 wr.opcode = IB_WR_SEND;
1753 wr.send_flags = IB_SEND_SIGNALED;
1754
1755 return ib_post_send(ch->qp, &wr, &bad_wr);
1756 }
1757
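/* Post @iu as a receive work request on the QP of @ch. */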
1758 static int srp_post_recv(struct srp_rdma_ch *ch, struct srp_iu *iu)
1759 {
1760 struct srp_target_port *target = ch->target;
1761 struct ib_recv_wr wr, *bad_wr;
1762 struct ib_sge list;
1763
1764 list.addr = iu->dma;
1765 list.length = iu->size;
1766 list.lkey = target->lkey;
1767
1768 wr.next = NULL;
1769 wr.wr_id = (uintptr_t) iu;
1770 wr.sg_list = &list;
1771 wr.num_sge = 1;
1772
1773 return ib_post_recv(ch->qp, &wr, &bad_wr);
1774 }
1775
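/*
 * Process an SRP_RSP information unit: complete either the task management
 * request or the SCSI command identified by the response tag.
 */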
1776 static void srp_process_rsp(struct srp_rdma_ch *ch, struct srp_rsp *rsp)
1777 {
1778 struct srp_target_port *target = ch->target;
1779 struct srp_request *req;
1780 struct scsi_cmnd *scmnd;
1781 unsigned long flags;
1782
1783 if (unlikely(rsp->tag & SRP_TAG_TSK_MGMT)) {
1784 spin_lock_irqsave(&ch->lock, flags);
1785 ch->req_lim += be32_to_cpu(rsp->req_lim_delta);
1786 spin_unlock_irqrestore(&ch->lock, flags);
1787
1788 ch->tsk_mgmt_status = -1;
1789 if (be32_to_cpu(rsp->resp_data_len) >= 4)
1790 ch->tsk_mgmt_status = rsp->data[3];
1791 complete(&ch->tsk_mgmt_done);
1792 } else {
1793 scmnd = scsi_host_find_tag(target->scsi_host, rsp->tag);
1794 if (scmnd) {
1795 req = (void *)scmnd->host_scribble;
1796 scmnd = srp_claim_req(ch, req, NULL, scmnd);
1797 }
1798 if (!scmnd) {
1799 shost_printk(KERN_ERR, target->scsi_host,
1800 "Null scmnd for RSP w/tag %#016llx received on ch %td / QP %#x\n",
1801 rsp->tag, ch - target->ch, ch->qp->qp_num);
1802
1803 spin_lock_irqsave(&ch->lock, flags);
1804 ch->req_lim += be32_to_cpu(rsp->req_lim_delta);
1805 spin_unlock_irqrestore(&ch->lock, flags);
1806
1807 return;
1808 }
1809 scmnd->result = rsp->status;
1810
1811 if (rsp->flags & SRP_RSP_FLAG_SNSVALID) {
1812 memcpy(scmnd->sense_buffer, rsp->data +
1813 be32_to_cpu(rsp->resp_data_len),
1814 min_t(int, be32_to_cpu(rsp->sense_data_len),
1815 SCSI_SENSE_BUFFERSIZE));
1816 }
1817
1818 if (unlikely(rsp->flags & SRP_RSP_FLAG_DIUNDER))
1819 scsi_set_resid(scmnd, be32_to_cpu(rsp->data_in_res_cnt));
1820 else if (unlikely(rsp->flags & SRP_RSP_FLAG_DIOVER))
1821 scsi_set_resid(scmnd, -be32_to_cpu(rsp->data_in_res_cnt));
1822 else if (unlikely(rsp->flags & SRP_RSP_FLAG_DOUNDER))
1823 scsi_set_resid(scmnd, be32_to_cpu(rsp->data_out_res_cnt));
1824 else if (unlikely(rsp->flags & SRP_RSP_FLAG_DOOVER))
1825 scsi_set_resid(scmnd, -be32_to_cpu(rsp->data_out_res_cnt));
1826
1827 srp_free_req(ch, req, scmnd,
1828 be32_to_cpu(rsp->req_lim_delta));
1829
1830 scmnd->host_scribble = NULL;
1831 scmnd->scsi_done(scmnd);
1832 }
1833 }
1834
1835 static int srp_response_common(struct srp_rdma_ch *ch, s32 req_delta,
1836 void *rsp, int len)
1837 {
1838 struct srp_target_port *target = ch->target;
1839 struct ib_device *dev = target->srp_host->srp_dev->dev;
1840 unsigned long flags;
1841 struct srp_iu *iu;
1842 int err;
1843
1844 spin_lock_irqsave(&ch->lock, flags);
1845 ch->req_lim += req_delta;
1846 iu = __srp_get_tx_iu(ch, SRP_IU_RSP);
1847 spin_unlock_irqrestore(&ch->lock, flags);
1848
1849 if (!iu) {
1850 shost_printk(KERN_ERR, target->scsi_host, PFX
1851 "no IU available to send response\n");
1852 return 1;
1853 }
1854
1855 ib_dma_sync_single_for_cpu(dev, iu->dma, len, DMA_TO_DEVICE);
1856 memcpy(iu->buf, rsp, len);
1857 ib_dma_sync_single_for_device(dev, iu->dma, len, DMA_TO_DEVICE);
1858
1859 err = srp_post_send(ch, iu, len);
1860 if (err) {
1861 shost_printk(KERN_ERR, target->scsi_host, PFX
1862 "unable to post response: %d\n", err);
1863 srp_put_tx_iu(ch, iu, SRP_IU_RSP);
1864 }
1865
1866 return err;
1867 }
1868
1869 static void srp_process_cred_req(struct srp_rdma_ch *ch,
1870 struct srp_cred_req *req)
1871 {
1872 struct srp_cred_rsp rsp = {
1873 .opcode = SRP_CRED_RSP,
1874 .tag = req->tag,
1875 };
1876 s32 delta = be32_to_cpu(req->req_lim_delta);
1877
1878 if (srp_response_common(ch, delta, &rsp, sizeof(rsp)))
1879 shost_printk(KERN_ERR, ch->target->scsi_host, PFX
1880 "problems processing SRP_CRED_REQ\n");
1881 }
1882
1883 static void srp_process_aer_req(struct srp_rdma_ch *ch,
1884 struct srp_aer_req *req)
1885 {
1886 struct srp_target_port *target = ch->target;
1887 struct srp_aer_rsp rsp = {
1888 .opcode = SRP_AER_RSP,
1889 .tag = req->tag,
1890 };
1891 s32 delta = be32_to_cpu(req->req_lim_delta);
1892
1893 shost_printk(KERN_ERR, target->scsi_host, PFX
1894 "ignoring AER for LUN %llu\n", scsilun_to_int(&req->lun));
1895
1896 if (srp_response_common(ch, delta, &rsp, sizeof(rsp)))
1897 shost_printk(KERN_ERR, target->scsi_host, PFX
1898 "problems processing SRP_AER_REQ\n");
1899 }
1900
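/*
 * Dispatch a received information unit according to its SRP opcode and
 * repost the receive buffer.
 */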
1901 static void srp_handle_recv(struct srp_rdma_ch *ch, struct ib_wc *wc)
1902 {
1903 struct srp_target_port *target = ch->target;
1904 struct ib_device *dev = target->srp_host->srp_dev->dev;
1905 struct srp_iu *iu = (struct srp_iu *) (uintptr_t) wc->wr_id;
1906 int res;
1907 u8 opcode;
1908
1909 ib_dma_sync_single_for_cpu(dev, iu->dma, ch->max_ti_iu_len,
1910 DMA_FROM_DEVICE);
1911
1912 opcode = *(u8 *) iu->buf;
1913
1914 if (0) {
1915 shost_printk(KERN_ERR, target->scsi_host,
1916 PFX "recv completion, opcode 0x%02x\n", opcode);
1917 print_hex_dump(KERN_ERR, "", DUMP_PREFIX_OFFSET, 8, 1,
1918 iu->buf, wc->byte_len, true);
1919 }
1920
1921 switch (opcode) {
1922 case SRP_RSP:
1923 srp_process_rsp(ch, iu->buf);
1924 break;
1925
1926 case SRP_CRED_REQ:
1927 srp_process_cred_req(ch, iu->buf);
1928 break;
1929
1930 case SRP_AER_REQ:
1931 srp_process_aer_req(ch, iu->buf);
1932 break;
1933
1934 case SRP_T_LOGOUT:
1935 /* XXX Handle target logout */
1936 shost_printk(KERN_WARNING, target->scsi_host,
1937 PFX "Got target logout request\n");
1938 break;
1939
1940 default:
1941 shost_printk(KERN_WARNING, target->scsi_host,
1942 PFX "Unhandled SRP opcode 0x%02x\n", opcode);
1943 break;
1944 }
1945
1946 ib_dma_sync_single_for_device(dev, iu->dma, ch->max_ti_iu_len,
1947 DMA_FROM_DEVICE);
1948
1949 res = srp_post_recv(ch, iu);
1950 if (res != 0)
1951 shost_printk(KERN_ERR, target->scsi_host,
1952 PFX "Recv failed with error code %d\n", res);
1953 }
1954
1955 /**
1956 * srp_tl_err_work() - handle a transport layer error
1957 * @work: Work structure embedded in an SRP target port.
1958 *
1959 * Note: This function may get invoked before the rport has been created,
1960 * hence the target->rport test.
1961 */
1962 static void srp_tl_err_work(struct work_struct *work)
1963 {
1964 struct srp_target_port *target;
1965
1966 target = container_of(work, struct srp_target_port, tl_err_work);
1967 if (target->rport)
1968 srp_start_tl_fail_timers(target->rport);
1969 }
1970
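/*
 * Handle an error work completion. A wr_id equal to SRP_LAST_WR_ID only
 * completes ch->done; the LOCAL_INV and FAST_REG bits in wr_id identify
 * failed memory registration work requests, and anything else is a regular
 * send or receive IU. Transport-layer error handling is deferred to
 * srp_tl_err_work() via system_long_wq.
 */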
1971 static void srp_handle_qp_err(u64 wr_id, enum ib_wc_status wc_status,
1972 bool send_err, struct srp_rdma_ch *ch)
1973 {
1974 struct srp_target_port *target = ch->target;
1975
1976 if (wr_id == SRP_LAST_WR_ID) {
1977 complete(&ch->done);
1978 return;
1979 }
1980
1981 if (ch->connected && !target->qp_in_error) {
1982 if (wr_id & LOCAL_INV_WR_ID_MASK) {
1983 shost_printk(KERN_ERR, target->scsi_host, PFX
1984 "LOCAL_INV failed with status %s (%d)\n",
1985 ib_wc_status_msg(wc_status), wc_status);
1986 } else if (wr_id & FAST_REG_WR_ID_MASK) {
1987 shost_printk(KERN_ERR, target->scsi_host, PFX
1988 "FAST_REG_MR failed status %s (%d)\n",
1989 ib_wc_status_msg(wc_status), wc_status);
1990 } else {
1991 shost_printk(KERN_ERR, target->scsi_host,
1992 PFX "failed %s status %s (%d) for iu %p\n",
1993 send_err ? "send" : "receive",
1994 ib_wc_status_msg(wc_status), wc_status,
1995 (void *)(uintptr_t)wr_id);
1996 }
1997 queue_work(system_long_wq, &target->tl_err_work);
1998 }
1999 target->qp_in_error = true;
2000 }
2001
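/*
 * Per-channel receive CQ callback: re-arm the completion notification first
 * and then drain the CQ one work completion at a time.
 */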
2002 static void srp_recv_completion(struct ib_cq *cq, void *ch_ptr)
2003 {
2004 struct srp_rdma_ch *ch = ch_ptr;
2005 struct ib_wc wc;
2006
2007 ib_req_notify_cq(cq, IB_CQ_NEXT_COMP);
2008 while (ib_poll_cq(cq, 1, &wc) > 0) {
2009 if (likely(wc.status == IB_WC_SUCCESS)) {
2010 srp_handle_recv(ch, &wc);
2011 } else {
2012 srp_handle_qp_err(wc.wr_id, wc.status, false, ch);
2013 }
2014 }
2015 }
2016
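/*
 * Per-channel send CQ callback. A successful send completion only returns
 * the transmit IU to the free_tx list; SCSI command completion is driven by
 * the SRP_RSP IU processed in srp_handle_recv(), not by the send completion.
 */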
2017 static void srp_send_completion(struct ib_cq *cq, void *ch_ptr)
2018 {
2019 struct srp_rdma_ch *ch = ch_ptr;
2020 struct ib_wc wc;
2021 struct srp_iu *iu;
2022
2023 while (ib_poll_cq(cq, 1, &wc) > 0) {
2024 if (likely(wc.status == IB_WC_SUCCESS)) {
2025 iu = (struct srp_iu *) (uintptr_t) wc.wr_id;
2026 list_add(&iu->list, &ch->free_tx);
2027 } else {
2028 srp_handle_qp_err(wc.wr_id, wc.status, true, ch);
2029 }
2030 }
2031 }
2032
2033 static int srp_queuecommand(struct Scsi_Host *shost, struct scsi_cmnd *scmnd)
2034 {
2035 struct srp_target_port *target = host_to_target(shost);
2036 struct srp_rport *rport = target->rport;
2037 struct srp_rdma_ch *ch;
2038 struct srp_request *req;
2039 struct srp_iu *iu;
2040 struct srp_cmd *cmd;
2041 struct ib_device *dev;
2042 unsigned long flags;
2043 u32 tag;
2044 u16 idx;
2045 int len, ret;
2046 const bool in_scsi_eh = !in_interrupt() && current == shost->ehandler;
2047
2048 /*
2049 * The SCSI EH thread is the only context from which srp_queuecommand()
2050 * can get invoked for blocked devices (SDEV_BLOCK /
2051 * SDEV_CREATED_BLOCK). Avoid racing with srp_reconnect_rport() by
2052 * locking the rport mutex if invoked from inside the SCSI EH.
2053 */
2054 if (in_scsi_eh)
2055 mutex_lock(&rport->mutex);
2056
2057 scmnd->result = srp_chkready(target->rport);
2058 if (unlikely(scmnd->result))
2059 goto err;
2060
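/*
 * The block layer tag encodes both the hardware queue and the per-queue
 * tag: the hardware queue index selects the RDMA channel and the per-queue
 * tag selects the slot in that channel's request ring.
 */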
2061 WARN_ON_ONCE(scmnd->request->tag < 0);
2062 tag = blk_mq_unique_tag(scmnd->request);
2063 ch = &target->ch[blk_mq_unique_tag_to_hwq(tag)];
2064 idx = blk_mq_unique_tag_to_tag(tag);
2065 WARN_ONCE(idx >= target->req_ring_size, "%s: tag %#x: idx %d >= %d\n",
2066 dev_name(&shost->shost_gendev), tag, idx,
2067 target->req_ring_size);
2068
2069 spin_lock_irqsave(&ch->lock, flags);
2070 iu = __srp_get_tx_iu(ch, SRP_IU_CMD);
2071 spin_unlock_irqrestore(&ch->lock, flags);
2072
2073 if (!iu)
2074 goto err;
2075
2076 req = &ch->req_ring[idx];
2077 dev = target->srp_host->srp_dev->dev;
2078 ib_dma_sync_single_for_cpu(dev, iu->dma, target->max_iu_len,
2079 DMA_TO_DEVICE);
2080
2081 scmnd->host_scribble = (void *) req;
2082
2083 cmd = iu->buf;
2084 memset(cmd, 0, sizeof *cmd);
2085
2086 cmd->opcode = SRP_CMD;
2087 int_to_scsilun(scmnd->device->lun, &cmd->lun);
2088 cmd->tag = tag;
2089 memcpy(cmd->cdb, scmnd->cmnd, scmnd->cmd_len);
2090
2091 req->scmnd = scmnd;
2092 req->cmd = iu;
2093
2094 len = srp_map_data(scmnd, ch, req);
2095 if (len < 0) {
2096 shost_printk(KERN_ERR, target->scsi_host,
2097 PFX "Failed to map data (%d)\n", len);
2098 /*
2099 * If we ran out of memory descriptors (-ENOMEM) because an
2100 * application is queuing many requests with more than
2101 * max_pages_per_mr sg-list elements, tell the SCSI mid-layer
2102 * to reduce queue depth temporarily.
2103 */
2104 scmnd->result = len == -ENOMEM ?
2105 DID_OK << 16 | QUEUE_FULL << 1 : DID_ERROR << 16;
2106 goto err_iu;
2107 }
2108
2109 ib_dma_sync_single_for_device(dev, iu->dma, target->max_iu_len,
2110 DMA_TO_DEVICE);
2111
2112 if (srp_post_send(ch, iu, len)) {
2113 shost_printk(KERN_ERR, target->scsi_host, PFX "Send failed\n");
2114 goto err_unmap;
2115 }
2116
2117 ret = 0;
2118
2119 unlock_rport:
2120 if (in_scsi_eh)
2121 mutex_unlock(&rport->mutex);
2122
2123 return ret;
2124
2125 err_unmap:
2126 srp_unmap_data(scmnd, ch, req);
2127
2128 err_iu:
2129 srp_put_tx_iu(ch, iu, SRP_IU_CMD);
2130
2131 /*
2132 * Prevent the loops that iterate over the request ring from
2133 * encountering a dangling SCSI command pointer.
2134 */
2135 req->scmnd = NULL;
2136
2137 err:
2138 if (scmnd->result) {
2139 scmnd->scsi_done(scmnd);
2140 ret = 0;
2141 } else {
2142 ret = SCSI_MLQUEUE_HOST_BUSY;
2143 }
2144
2145 goto unlock_rport;
2146 }
2147
2148 /*
2149 * Note: the resources allocated in this function are freed in
2150 * srp_free_ch_ib().
2151 */
2152 static int srp_alloc_iu_bufs(struct srp_rdma_ch *ch)
2153 {
2154 struct srp_target_port *target = ch->target;
2155 int i;
2156
2157 ch->rx_ring = kcalloc(target->queue_size, sizeof(*ch->rx_ring),
2158 GFP_KERNEL);
2159 if (!ch->rx_ring)
2160 goto err_no_ring;
2161 ch->tx_ring = kcalloc(target->queue_size, sizeof(*ch->tx_ring),
2162 GFP_KERNEL);
2163 if (!ch->tx_ring)
2164 goto err_no_ring;
2165
2166 for (i = 0; i < target->queue_size; ++i) {
2167 ch->rx_ring[i] = srp_alloc_iu(target->srp_host,
2168 ch->max_ti_iu_len,
2169 GFP_KERNEL, DMA_FROM_DEVICE);
2170 if (!ch->rx_ring[i])
2171 goto err;
2172 }
2173
2174 for (i = 0; i < target->queue_size; ++i) {
2175 ch->tx_ring[i] = srp_alloc_iu(target->srp_host,
2176 target->max_iu_len,
2177 GFP_KERNEL, DMA_TO_DEVICE);
2178 if (!ch->tx_ring[i])
2179 goto err;
2180
2181 list_add(&ch->tx_ring[i]->list, &ch->free_tx);
2182 }
2183
2184 return 0;
2185
2186 err:
2187 for (i = 0; i < target->queue_size; ++i) {
2188 srp_free_iu(target->srp_host, ch->rx_ring[i]);
2189 srp_free_iu(target->srp_host, ch->tx_ring[i]);
2190 }
2191
2192
2193 err_no_ring:
2194 kfree(ch->tx_ring);
2195 ch->tx_ring = NULL;
2196 kfree(ch->rx_ring);
2197 ch->rx_ring = NULL;
2198
2199 return -ENOMEM;
2200 }
2201
2202 static uint32_t srp_compute_rq_tmo(struct ib_qp_attr *qp_attr, int attr_mask)
2203 {
2204 uint64_t T_tr_ns, max_compl_time_ms;
2205 uint32_t rq_tmo_jiffies;
2206
2207 /*
2208 * According to section 11.2.4.2 in the IBTA spec (Modify Queue Pair,
2209 * table 91), both the QP timeout and the retry count have to be set
2210 * for RC QP's during the RTR to RTS transition.
2211 */
2212 WARN_ON_ONCE((attr_mask & (IB_QP_TIMEOUT | IB_QP_RETRY_CNT)) !=
2213 (IB_QP_TIMEOUT | IB_QP_RETRY_CNT));
2214
2215 /*
2216 * Set target->rq_tmo_jiffies to one second more than the largest time
2217 * it can take before an error completion is generated. See also
2218 * C9-140..142 in the IBTA spec for more information about how to
2219 * convert the QP Local ACK Timeout value to nanoseconds.
2220 */
2221 T_tr_ns = 4096 * (1ULL << qp_attr->timeout);
2222 max_compl_time_ms = qp_attr->retry_cnt * 4 * T_tr_ns;
2223 do_div(max_compl_time_ms, NSEC_PER_MSEC);
2224 rq_tmo_jiffies = msecs_to_jiffies(max_compl_time_ms + 1000);
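/*
 * Worked example: with qp_attr->timeout == 19 and retry_cnt == 7,
 * T_tr = 4096 ns * 2^19 ~= 2.15 s, the worst-case completion time is
 * 7 * 4 * 2.15 s ~= 60 s and hence rq_tmo_jiffies corresponds to ~61 s.
 */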
2225
2226 return rq_tmo_jiffies;
2227 }
2228
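/*
 * Process a connection manager REP: parse the SRP_LOGIN_RSP, allocate the
 * RX/TX IU rings on the first successful login, move the QP to RTR, post
 * the initial receives, transition the QP to RTS and finally acknowledge
 * the REP by sending an RTU.
 */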
2229 static void srp_cm_rep_handler(struct ib_cm_id *cm_id,
2230 const struct srp_login_rsp *lrsp,
2231 struct srp_rdma_ch *ch)
2232 {
2233 struct srp_target_port *target = ch->target;
2234 struct ib_qp_attr *qp_attr = NULL;
2235 int attr_mask = 0;
2236 int ret;
2237 int i;
2238
2239 if (lrsp->opcode == SRP_LOGIN_RSP) {
2240 ch->max_ti_iu_len = be32_to_cpu(lrsp->max_ti_iu_len);
2241 ch->req_lim = be32_to_cpu(lrsp->req_lim_delta);
2242
2243 /*
2244 * Reserve credits for task management so we don't
2245 * bounce requests back to the SCSI mid-layer.
2246 */
2247 target->scsi_host->can_queue
2248 = min(ch->req_lim - SRP_TSK_MGMT_SQ_SIZE,
2249 target->scsi_host->can_queue);
2250 target->scsi_host->cmd_per_lun
2251 = min_t(int, target->scsi_host->can_queue,
2252 target->scsi_host->cmd_per_lun);
2253 } else {
2254 shost_printk(KERN_WARNING, target->scsi_host,
2255 PFX "Unhandled RSP opcode %#x\n", lrsp->opcode);
2256 ret = -ECONNRESET;
2257 goto error;
2258 }
2259
2260 if (!ch->rx_ring) {
2261 ret = srp_alloc_iu_bufs(ch);
2262 if (ret)
2263 goto error;
2264 }
2265
2266 ret = -ENOMEM;
2267 qp_attr = kmalloc(sizeof *qp_attr, GFP_KERNEL);
2268 if (!qp_attr)
2269 goto error;
2270
2271 qp_attr->qp_state = IB_QPS_RTR;
2272 ret = ib_cm_init_qp_attr(cm_id, qp_attr, &attr_mask);
2273 if (ret)
2274 goto error_free;
2275
2276 ret = ib_modify_qp(ch->qp, qp_attr, attr_mask);
2277 if (ret)
2278 goto error_free;
2279
2280 for (i = 0; i < target->queue_size; i++) {
2281 struct srp_iu *iu = ch->rx_ring[i];
2282
2283 ret = srp_post_recv(ch, iu);
2284 if (ret)
2285 goto error_free;
2286 }
2287
2288 qp_attr->qp_state = IB_QPS_RTS;
2289 ret = ib_cm_init_qp_attr(cm_id, qp_attr, &attr_mask);
2290 if (ret)
2291 goto error_free;
2292
2293 target->rq_tmo_jiffies = srp_compute_rq_tmo(qp_attr, attr_mask);
2294
2295 ret = ib_modify_qp(ch->qp, qp_attr, attr_mask);
2296 if (ret)
2297 goto error_free;
2298
2299 ret = ib_send_cm_rtu(cm_id, NULL, 0);
2300
2301 error_free:
2302 kfree(qp_attr);
2303
2304 error:
2305 ch->status = ret;
2306 }
2307
2308 static void srp_cm_rej_handler(struct ib_cm_id *cm_id,
2309 struct ib_cm_event *event,
2310 struct srp_rdma_ch *ch)
2311 {
2312 struct srp_target_port *target = ch->target;
2313 struct Scsi_Host *shost = target->scsi_host;
2314 struct ib_class_port_info *cpi;
2315 int opcode;
2316
2317 switch (event->param.rej_rcvd.reason) {
2318 case IB_CM_REJ_PORT_CM_REDIRECT:
2319 cpi = event->param.rej_rcvd.ari;
2320 ch->path.dlid = cpi->redirect_lid;
2321 ch->path.pkey = cpi->redirect_pkey;
2322 cm_id->remote_cm_qpn = be32_to_cpu(cpi->redirect_qp) & 0x00ffffff;
2323 memcpy(ch->path.dgid.raw, cpi->redirect_gid, 16);
2324
2325 ch->status = ch->path.dlid ?
2326 SRP_DLID_REDIRECT : SRP_PORT_REDIRECT;
2327 break;
2328
2329 case IB_CM_REJ_PORT_REDIRECT:
2330 if (srp_target_is_topspin(target)) {
2331 /*
2332 * Topspin/Cisco SRP gateways incorrectly send
2333 * reject reason code 25 when they mean 24
2334 * (port redirect).
2335 */
2336 memcpy(ch->path.dgid.raw,
2337 event->param.rej_rcvd.ari, 16);
2338
2339 shost_printk(KERN_DEBUG, shost,
2340 PFX "Topspin/Cisco redirect to target port GID %016llx%016llx\n",
2341 be64_to_cpu(ch->path.dgid.global.subnet_prefix),
2342 be64_to_cpu(ch->path.dgid.global.interface_id));
2343
2344 ch->status = SRP_PORT_REDIRECT;
2345 } else {
2346 shost_printk(KERN_WARNING, shost,
2347 " REJ reason: IB_CM_REJ_PORT_REDIRECT\n");
2348 ch->status = -ECONNRESET;
2349 }
2350 break;
2351
2352 case IB_CM_REJ_DUPLICATE_LOCAL_COMM_ID:
2353 shost_printk(KERN_WARNING, shost,
2354 " REJ reason: IB_CM_REJ_DUPLICATE_LOCAL_COMM_ID\n");
2355 ch->status = -ECONNRESET;
2356 break;
2357
2358 case IB_CM_REJ_CONSUMER_DEFINED:
2359 opcode = *(u8 *) event->private_data;
2360 if (opcode == SRP_LOGIN_REJ) {
2361 struct srp_login_rej *rej = event->private_data;
2362 u32 reason = be32_to_cpu(rej->reason);
2363
2364 if (reason == SRP_LOGIN_REJ_REQ_IT_IU_LENGTH_TOO_LARGE)
2365 shost_printk(KERN_WARNING, shost,
2366 PFX "SRP_LOGIN_REJ: requested max_it_iu_len too large\n");
2367 else
2368 shost_printk(KERN_WARNING, shost, PFX
2369 "SRP LOGIN from %pI6 to %pI6 REJECTED, reason 0x%08x\n",
2370 target->sgid.raw,
2371 target->orig_dgid.raw, reason);
2372 } else
2373 shost_printk(KERN_WARNING, shost,
2374 " REJ reason: IB_CM_REJ_CONSUMER_DEFINED,"
2375 " opcode 0x%02x\n", opcode);
2376 ch->status = -ECONNRESET;
2377 break;
2378
2379 case IB_CM_REJ_STALE_CONN:
2380 shost_printk(KERN_WARNING, shost, " REJ reason: stale connection\n");
2381 ch->status = SRP_STALE_CONN;
2382 break;
2383
2384 default:
2385 shost_printk(KERN_WARNING, shost, " REJ reason 0x%x\n",
2386 event->param.rej_rcvd.reason);
2387 ch->status = -ECONNRESET;
2388 }
2389 }
2390
2391 static int srp_cm_handler(struct ib_cm_id *cm_id, struct ib_cm_event *event)
2392 {
2393 struct srp_rdma_ch *ch = cm_id->context;
2394 struct srp_target_port *target = ch->target;
2395 int comp = 0;
2396
2397 switch (event->event) {
2398 case IB_CM_REQ_ERROR:
2399 shost_printk(KERN_DEBUG, target->scsi_host,
2400 PFX "Sending CM REQ failed\n");
2401 comp = 1;
2402 ch->status = -ECONNRESET;
2403 break;
2404
2405 case IB_CM_REP_RECEIVED:
2406 comp = 1;
2407 srp_cm_rep_handler(cm_id, event->private_data, ch);
2408 break;
2409
2410 case IB_CM_REJ_RECEIVED:
2411 shost_printk(KERN_DEBUG, target->scsi_host, PFX "REJ received\n");
2412 comp = 1;
2413
2414 srp_cm_rej_handler(cm_id, event, ch);
2415 break;
2416
2417 case IB_CM_DREQ_RECEIVED:
2418 shost_printk(KERN_WARNING, target->scsi_host,
2419 PFX "DREQ received - connection closed\n");
2420 ch->connected = false;
2421 if (ib_send_cm_drep(cm_id, NULL, 0))
2422 shost_printk(KERN_ERR, target->scsi_host,
2423 PFX "Sending CM DREP failed\n");
2424 queue_work(system_long_wq, &target->tl_err_work);
2425 break;
2426
2427 case IB_CM_TIMEWAIT_EXIT:
2428 shost_printk(KERN_ERR, target->scsi_host,
2429 PFX "connection closed\n");
2430 comp = 1;
2431
2432 ch->status = 0;
2433 break;
2434
2435 case IB_CM_MRA_RECEIVED:
2436 case IB_CM_DREQ_ERROR:
2437 case IB_CM_DREP_RECEIVED:
2438 break;
2439
2440 default:
2441 shost_printk(KERN_WARNING, target->scsi_host,
2442 PFX "Unhandled CM event %d\n", event->event);
2443 break;
2444 }
2445
2446 if (comp)
2447 complete(&ch->done);
2448
2449 return 0;
2450 }
2451
2452 /**
2453 * srp_change_queue_depth - set the device queue depth
2454 * @sdev: scsi device struct
2455 * @qdepth: requested queue depth
2456 *
2457 * Returns queue depth.
2458 */
2459 static int
2460 srp_change_queue_depth(struct scsi_device *sdev, int qdepth)
2461 {
2462 if (!sdev->tagged_supported)
2463 qdepth = 1;
2464 return scsi_change_queue_depth(sdev, qdepth);
2465 }
2466
2467 static int srp_send_tsk_mgmt(struct srp_rdma_ch *ch, u64 req_tag, u64 lun,
2468 u8 func)
2469 {
2470 struct srp_target_port *target = ch->target;
2471 struct srp_rport *rport = target->rport;
2472 struct ib_device *dev = target->srp_host->srp_dev->dev;
2473 struct srp_iu *iu;
2474 struct srp_tsk_mgmt *tsk_mgmt;
2475
2476 if (!ch->connected || target->qp_in_error)
2477 return -1;
2478
2479 init_completion(&ch->tsk_mgmt_done);
2480
2481 /*
2482 * Lock the rport mutex to prevent srp_create_ch_ib() from being
2483 * invoked while a task management function is being sent.
2484 */
2485 mutex_lock(&rport->mutex);
2486 spin_lock_irq(&ch->lock);
2487 iu = __srp_get_tx_iu(ch, SRP_IU_TSK_MGMT);
2488 spin_unlock_irq(&ch->lock);
2489
2490 if (!iu) {
2491 mutex_unlock(&rport->mutex);
2492
2493 return -1;
2494 }
2495
2496 ib_dma_sync_single_for_cpu(dev, iu->dma, sizeof *tsk_mgmt,
2497 DMA_TO_DEVICE);
2498 tsk_mgmt = iu->buf;
2499 memset(tsk_mgmt, 0, sizeof *tsk_mgmt);
2500
2501 tsk_mgmt->opcode = SRP_TSK_MGMT;
2502 int_to_scsilun(lun, &tsk_mgmt->lun);
2503 tsk_mgmt->tag = req_tag | SRP_TAG_TSK_MGMT;
2504 tsk_mgmt->tsk_mgmt_func = func;
2505 tsk_mgmt->task_tag = req_tag;
2506
2507 ib_dma_sync_single_for_device(dev, iu->dma, sizeof *tsk_mgmt,
2508 DMA_TO_DEVICE);
2509 if (srp_post_send(ch, iu, sizeof(*tsk_mgmt))) {
2510 srp_put_tx_iu(ch, iu, SRP_IU_TSK_MGMT);
2511 mutex_unlock(&rport->mutex);
2512
2513 return -1;
2514 }
2515 mutex_unlock(&rport->mutex);
2516
2517 if (!wait_for_completion_timeout(&ch->tsk_mgmt_done,
2518 msecs_to_jiffies(SRP_ABORT_TIMEOUT_MS)))
2519 return -1;
2520
2521 return 0;
2522 }
2523
2524 static int srp_abort(struct scsi_cmnd *scmnd)
2525 {
2526 struct srp_target_port *target = host_to_target(scmnd->device->host);
2527 struct srp_request *req = (struct srp_request *) scmnd->host_scribble;
2528 u32 tag;
2529 u16 ch_idx;
2530 struct srp_rdma_ch *ch;
2531 int ret;
2532
2533 shost_printk(KERN_ERR, target->scsi_host, "SRP abort called\n");
2534
2535 if (!req)
2536 return SUCCESS;
2537 tag = blk_mq_unique_tag(scmnd->request);
2538 ch_idx = blk_mq_unique_tag_to_hwq(tag);
2539 if (WARN_ON_ONCE(ch_idx >= target->ch_count))
2540 return SUCCESS;
2541 ch = &target->ch[ch_idx];
2542 if (!srp_claim_req(ch, req, NULL, scmnd))
2543 return SUCCESS;
2544 shost_printk(KERN_ERR, target->scsi_host,
2545 "Sending SRP abort for tag %#x\n", tag);
2546 if (srp_send_tsk_mgmt(ch, tag, scmnd->device->lun,
2547 SRP_TSK_ABORT_TASK) == 0)
2548 ret = SUCCESS;
2549 else if (target->rport->state == SRP_RPORT_LOST)
2550 ret = FAST_IO_FAIL;
2551 else
2552 ret = FAILED;
2553 srp_free_req(ch, req, scmnd, 0);
2554 scmnd->result = DID_ABORT << 16;
2555 scmnd->scsi_done(scmnd);
2556
2557 return ret;
2558 }
2559
2560 static int srp_reset_device(struct scsi_cmnd *scmnd)
2561 {
2562 struct srp_target_port *target = host_to_target(scmnd->device->host);
2563 struct srp_rdma_ch *ch;
2564 int i, j;
2565
2566 shost_printk(KERN_ERR, target->scsi_host, "SRP reset_device called\n");
2567
2568 ch = &target->ch[0];
2569 if (srp_send_tsk_mgmt(ch, SRP_TAG_NO_REQ, scmnd->device->lun,
2570 SRP_TSK_LUN_RESET))
2571 return FAILED;
2572 if (ch->tsk_mgmt_status)
2573 return FAILED;
2574
2575 for (i = 0; i < target->ch_count; i++) {
2576 ch = &target->ch[i];
2577 for (j = 0; j < target->req_ring_size; ++j) {
2578 struct srp_request *req = &ch->req_ring[j];
2579
2580 srp_finish_req(ch, req, scmnd->device, DID_RESET << 16);
2581 }
2582 }
2583
2584 return SUCCESS;
2585 }
2586
2587 static int srp_reset_host(struct scsi_cmnd *scmnd)
2588 {
2589 struct srp_target_port *target = host_to_target(scmnd->device->host);
2590
2591 shost_printk(KERN_ERR, target->scsi_host, PFX "SRP reset_host called\n");
2592
2593 return srp_reconnect_rport(target->rport) == 0 ? SUCCESS : FAILED;
2594 }
2595
2596 static int srp_slave_configure(struct scsi_device *sdev)
2597 {
2598 struct Scsi_Host *shost = sdev->host;
2599 struct srp_target_port *target = host_to_target(shost);
2600 struct request_queue *q = sdev->request_queue;
2601 unsigned long timeout;
2602
2603 if (sdev->type == TYPE_DISK) {
2604 timeout = max_t(unsigned, 30 * HZ, target->rq_tmo_jiffies);
2605 blk_queue_rq_timeout(q, timeout);
2606 }
2607
2608 return 0;
2609 }
2610
2611 static ssize_t show_id_ext(struct device *dev, struct device_attribute *attr,
2612 char *buf)
2613 {
2614 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2615
2616 return sprintf(buf, "0x%016llx\n", be64_to_cpu(target->id_ext));
2617 }
2618
2619 static ssize_t show_ioc_guid(struct device *dev, struct device_attribute *attr,
2620 char *buf)
2621 {
2622 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2623
2624 return sprintf(buf, "0x%016llx\n", be64_to_cpu(target->ioc_guid));
2625 }
2626
2627 static ssize_t show_service_id(struct device *dev,
2628 struct device_attribute *attr, char *buf)
2629 {
2630 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2631
2632 return sprintf(buf, "0x%016llx\n", be64_to_cpu(target->service_id));
2633 }
2634
2635 static ssize_t show_pkey(struct device *dev, struct device_attribute *attr,
2636 char *buf)
2637 {
2638 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2639
2640 return sprintf(buf, "0x%04x\n", be16_to_cpu(target->pkey));
2641 }
2642
2643 static ssize_t show_sgid(struct device *dev, struct device_attribute *attr,
2644 char *buf)
2645 {
2646 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2647
2648 return sprintf(buf, "%pI6\n", target->sgid.raw);
2649 }
2650
2651 static ssize_t show_dgid(struct device *dev, struct device_attribute *attr,
2652 char *buf)
2653 {
2654 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2655 struct srp_rdma_ch *ch = &target->ch[0];
2656
2657 return sprintf(buf, "%pI6\n", ch->path.dgid.raw);
2658 }
2659
2660 static ssize_t show_orig_dgid(struct device *dev,
2661 struct device_attribute *attr, char *buf)
2662 {
2663 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2664
2665 return sprintf(buf, "%pI6\n", target->orig_dgid.raw);
2666 }
2667
2668 static ssize_t show_req_lim(struct device *dev,
2669 struct device_attribute *attr, char *buf)
2670 {
2671 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2672 struct srp_rdma_ch *ch;
2673 int i, req_lim = INT_MAX;
2674
2675 for (i = 0; i < target->ch_count; i++) {
2676 ch = &target->ch[i];
2677 req_lim = min(req_lim, ch->req_lim);
2678 }
2679 return sprintf(buf, "%d\n", req_lim);
2680 }
2681
2682 static ssize_t show_zero_req_lim(struct device *dev,
2683 struct device_attribute *attr, char *buf)
2684 {
2685 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2686
2687 return sprintf(buf, "%d\n", target->zero_req_lim);
2688 }
2689
2690 static ssize_t show_local_ib_port(struct device *dev,
2691 struct device_attribute *attr, char *buf)
2692 {
2693 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2694
2695 return sprintf(buf, "%d\n", target->srp_host->port);
2696 }
2697
2698 static ssize_t show_local_ib_device(struct device *dev,
2699 struct device_attribute *attr, char *buf)
2700 {
2701 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2702
2703 return sprintf(buf, "%s\n", target->srp_host->srp_dev->dev->name);
2704 }
2705
2706 static ssize_t show_ch_count(struct device *dev, struct device_attribute *attr,
2707 char *buf)
2708 {
2709 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2710
2711 return sprintf(buf, "%d\n", target->ch_count);
2712 }
2713
2714 static ssize_t show_comp_vector(struct device *dev,
2715 struct device_attribute *attr, char *buf)
2716 {
2717 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2718
2719 return sprintf(buf, "%d\n", target->comp_vector);
2720 }
2721
2722 static ssize_t show_tl_retry_count(struct device *dev,
2723 struct device_attribute *attr, char *buf)
2724 {
2725 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2726
2727 return sprintf(buf, "%d\n", target->tl_retry_count);
2728 }
2729
2730 static ssize_t show_cmd_sg_entries(struct device *dev,
2731 struct device_attribute *attr, char *buf)
2732 {
2733 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2734
2735 return sprintf(buf, "%u\n", target->cmd_sg_cnt);
2736 }
2737
2738 static ssize_t show_allow_ext_sg(struct device *dev,
2739 struct device_attribute *attr, char *buf)
2740 {
2741 struct srp_target_port *target = host_to_target(class_to_shost(dev));
2742
2743 return sprintf(buf, "%s\n", target->allow_ext_sg ? "true" : "false");
2744 }
2745
2746 static DEVICE_ATTR(id_ext, S_IRUGO, show_id_ext, NULL);
2747 static DEVICE_ATTR(ioc_guid, S_IRUGO, show_ioc_guid, NULL);
2748 static DEVICE_ATTR(service_id, S_IRUGO, show_service_id, NULL);
2749 static DEVICE_ATTR(pkey, S_IRUGO, show_pkey, NULL);
2750 static DEVICE_ATTR(sgid, S_IRUGO, show_sgid, NULL);
2751 static DEVICE_ATTR(dgid, S_IRUGO, show_dgid, NULL);
2752 static DEVICE_ATTR(orig_dgid, S_IRUGO, show_orig_dgid, NULL);
2753 static DEVICE_ATTR(req_lim, S_IRUGO, show_req_lim, NULL);
2754 static DEVICE_ATTR(zero_req_lim, S_IRUGO, show_zero_req_lim, NULL);
2755 static DEVICE_ATTR(local_ib_port, S_IRUGO, show_local_ib_port, NULL);
2756 static DEVICE_ATTR(local_ib_device, S_IRUGO, show_local_ib_device, NULL);
2757 static DEVICE_ATTR(ch_count, S_IRUGO, show_ch_count, NULL);
2758 static DEVICE_ATTR(comp_vector, S_IRUGO, show_comp_vector, NULL);
2759 static DEVICE_ATTR(tl_retry_count, S_IRUGO, show_tl_retry_count, NULL);
2760 static DEVICE_ATTR(cmd_sg_entries, S_IRUGO, show_cmd_sg_entries, NULL);
2761 static DEVICE_ATTR(allow_ext_sg, S_IRUGO, show_allow_ext_sg, NULL);
2762
2763 static struct device_attribute *srp_host_attrs[] = {
2764 &dev_attr_id_ext,
2765 &dev_attr_ioc_guid,
2766 &dev_attr_service_id,
2767 &dev_attr_pkey,
2768 &dev_attr_sgid,
2769 &dev_attr_dgid,
2770 &dev_attr_orig_dgid,
2771 &dev_attr_req_lim,
2772 &dev_attr_zero_req_lim,
2773 &dev_attr_local_ib_port,
2774 &dev_attr_local_ib_device,
2775 &dev_attr_ch_count,
2776 &dev_attr_comp_vector,
2777 &dev_attr_tl_retry_count,
2778 &dev_attr_cmd_sg_entries,
2779 &dev_attr_allow_ext_sg,
2780 NULL
2781 };
2782
2783 static struct scsi_host_template srp_template = {
2784 .module = THIS_MODULE,
2785 .name = "InfiniBand SRP initiator",
2786 .proc_name = DRV_NAME,
2787 .slave_configure = srp_slave_configure,
2788 .info = srp_target_info,
2789 .queuecommand = srp_queuecommand,
2790 .change_queue_depth = srp_change_queue_depth,
2791 .eh_abort_handler = srp_abort,
2792 .eh_device_reset_handler = srp_reset_device,
2793 .eh_host_reset_handler = srp_reset_host,
2794 .skip_settle_delay = true,
2795 .sg_tablesize = SRP_DEF_SG_TABLESIZE,
2796 .can_queue = SRP_DEFAULT_CMD_SQ_SIZE,
2797 .this_id = -1,
2798 .cmd_per_lun = SRP_DEFAULT_CMD_SQ_SIZE,
2799 .use_clustering = ENABLE_CLUSTERING,
2800 .shost_attrs = srp_host_attrs,
2801 .use_blk_tags = 1,
2802 .track_queue_depth = 1,
2803 };
2804
2805 static int srp_sdev_count(struct Scsi_Host *host)
2806 {
2807 struct scsi_device *sdev;
2808 int c = 0;
2809
2810 shost_for_each_device(sdev, host)
2811 c++;
2812
2813 return c;
2814 }
2815
2816 /*
2817 * Return values:
2818 * < 0 upon failure. Caller is responsible for SRP target port cleanup.
2819 * 0 and target->state == SRP_TARGET_REMOVED if asynchronous target port
2820 * removal has been scheduled.
2821 * 0 and target->state != SRP_TARGET_REMOVED upon success.
2822 */
2823 static int srp_add_target(struct srp_host *host, struct srp_target_port *target)
2824 {
2825 struct srp_rport_identifiers ids;
2826 struct srp_rport *rport;
2827
2828 target->state = SRP_TARGET_SCANNING;
2829 sprintf(target->target_name, "SRP.T10:%016llX",
2830 be64_to_cpu(target->id_ext));
2831
2832 if (scsi_add_host(target->scsi_host, host->srp_dev->dev->dma_device))
2833 return -ENODEV;
2834
2835 memcpy(ids.port_id, &target->id_ext, 8);
2836 memcpy(ids.port_id + 8, &target->ioc_guid, 8);
2837 ids.roles = SRP_RPORT_ROLE_TARGET;
2838 rport = srp_rport_add(target->scsi_host, &ids);
2839 if (IS_ERR(rport)) {
2840 scsi_remove_host(target->scsi_host);
2841 return PTR_ERR(rport);
2842 }
2843
2844 rport->lld_data = target;
2845 target->rport = rport;
2846
2847 spin_lock(&host->target_lock);
2848 list_add_tail(&target->list, &host->target_list);
2849 spin_unlock(&host->target_lock);
2850
2851 scsi_scan_target(&target->scsi_host->shost_gendev,
2852 0, target->scsi_id, SCAN_WILD_CARD, 0);
2853
2854 if (srp_connected_ch(target) < target->ch_count ||
2855 target->qp_in_error) {
2856 shost_printk(KERN_INFO, target->scsi_host,
2857 PFX "SCSI scan failed - removing SCSI host\n");
2858 srp_queue_remove_work(target);
2859 goto out;
2860 }
2861
2862 pr_debug("%s: SCSI scan succeeded - detected %d LUNs\n",
2863 dev_name(&target->scsi_host->shost_gendev),
2864 srp_sdev_count(target->scsi_host));
2865
2866 spin_lock_irq(&target->lock);
2867 if (target->state == SRP_TARGET_SCANNING)
2868 target->state = SRP_TARGET_LIVE;
2869 spin_unlock_irq(&target->lock);
2870
2871 out:
2872 return 0;
2873 }
2874
2875 static void srp_release_dev(struct device *dev)
2876 {
2877 struct srp_host *host =
2878 container_of(dev, struct srp_host, dev);
2879
2880 complete(&host->released);
2881 }
2882
2883 static struct class srp_class = {
2884 .name = "infiniband_srp",
2885 .dev_release = srp_release_dev
2886 };
2887
2888 /**
2889 * srp_conn_unique() - check whether the connection to a target is unique
2890 * @host: SRP host.
2891 * @target: SRP target port.
2892 */
2893 static bool srp_conn_unique(struct srp_host *host,
2894 struct srp_target_port *target)
2895 {
2896 struct srp_target_port *t;
2897 bool ret = false;
2898
2899 if (target->state == SRP_TARGET_REMOVED)
2900 goto out;
2901
2902 ret = true;
2903
2904 spin_lock(&host->target_lock);
2905 list_for_each_entry(t, &host->target_list, list) {
2906 if (t != target &&
2907 target->id_ext == t->id_ext &&
2908 target->ioc_guid == t->ioc_guid &&
2909 target->initiator_ext == t->initiator_ext) {
2910 ret = false;
2911 break;
2912 }
2913 }
2914 spin_unlock(&host->target_lock);
2915
2916 out:
2917 return ret;
2918 }
2919
2920 /*
2921 * Target ports are added by writing
2922 *
2923 * id_ext=<SRP ID ext>,ioc_guid=<SRP IOC GUID>,dgid=<dest GID>,
2924 * pkey=<P_Key>,service_id=<service ID>
2925 *
2926 * to the add_target sysfs attribute.
2927 */
2928 enum {
2929 SRP_OPT_ERR = 0,
2930 SRP_OPT_ID_EXT = 1 << 0,
2931 SRP_OPT_IOC_GUID = 1 << 1,
2932 SRP_OPT_DGID = 1 << 2,
2933 SRP_OPT_PKEY = 1 << 3,
2934 SRP_OPT_SERVICE_ID = 1 << 4,
2935 SRP_OPT_MAX_SECT = 1 << 5,
2936 SRP_OPT_MAX_CMD_PER_LUN = 1 << 6,
2937 SRP_OPT_IO_CLASS = 1 << 7,
2938 SRP_OPT_INITIATOR_EXT = 1 << 8,
2939 SRP_OPT_CMD_SG_ENTRIES = 1 << 9,
2940 SRP_OPT_ALLOW_EXT_SG = 1 << 10,
2941 SRP_OPT_SG_TABLESIZE = 1 << 11,
2942 SRP_OPT_COMP_VECTOR = 1 << 12,
2943 SRP_OPT_TL_RETRY_COUNT = 1 << 13,
2944 SRP_OPT_QUEUE_SIZE = 1 << 14,
2945 SRP_OPT_ALL = (SRP_OPT_ID_EXT |
2946 SRP_OPT_IOC_GUID |
2947 SRP_OPT_DGID |
2948 SRP_OPT_PKEY |
2949 SRP_OPT_SERVICE_ID),
2950 };
2951
2952 static const match_table_t srp_opt_tokens = {
2953 { SRP_OPT_ID_EXT, "id_ext=%s" },
2954 { SRP_OPT_IOC_GUID, "ioc_guid=%s" },
2955 { SRP_OPT_DGID, "dgid=%s" },
2956 { SRP_OPT_PKEY, "pkey=%x" },
2957 { SRP_OPT_SERVICE_ID, "service_id=%s" },
2958 { SRP_OPT_MAX_SECT, "max_sect=%d" },
2959 { SRP_OPT_MAX_CMD_PER_LUN, "max_cmd_per_lun=%d" },
2960 { SRP_OPT_IO_CLASS, "io_class=%x" },
2961 { SRP_OPT_INITIATOR_EXT, "initiator_ext=%s" },
2962 { SRP_OPT_CMD_SG_ENTRIES, "cmd_sg_entries=%u" },
2963 { SRP_OPT_ALLOW_EXT_SG, "allow_ext_sg=%u" },
2964 { SRP_OPT_SG_TABLESIZE, "sg_tablesize=%u" },
2965 { SRP_OPT_COMP_VECTOR, "comp_vector=%u" },
2966 { SRP_OPT_TL_RETRY_COUNT, "tl_retry_count=%u" },
2967 { SRP_OPT_QUEUE_SIZE, "queue_size=%d" },
2968 { SRP_OPT_ERR, NULL }
2969 };
2970
2971 static int srp_parse_options(const char *buf, struct srp_target_port *target)
2972 {
2973 char *options, *sep_opt;
2974 char *p;
2975 char dgid[3];
2976 substring_t args[MAX_OPT_ARGS];
2977 int opt_mask = 0;
2978 int token;
2979 int ret = -EINVAL;
2980 int i;
2981
2982 options = kstrdup(buf, GFP_KERNEL);
2983 if (!options)
2984 return -ENOMEM;
2985
2986 sep_opt = options;
2987 while ((p = strsep(&sep_opt, ",\n")) != NULL) {
2988 if (!*p)
2989 continue;
2990
2991 token = match_token(p, srp_opt_tokens, args);
2992 opt_mask |= token;
2993
2994 switch (token) {
2995 case SRP_OPT_ID_EXT:
2996 p = match_strdup(args);
2997 if (!p) {
2998 ret = -ENOMEM;
2999 goto out;
3000 }
3001 target->id_ext = cpu_to_be64(simple_strtoull(p, NULL, 16));
3002 kfree(p);
3003 break;
3004
3005 case SRP_OPT_IOC_GUID:
3006 p = match_strdup(args);
3007 if (!p) {
3008 ret = -ENOMEM;
3009 goto out;
3010 }
3011 target->ioc_guid = cpu_to_be64(simple_strtoull(p, NULL, 16));
3012 kfree(p);
3013 break;
3014
3015 case SRP_OPT_DGID:
3016 p = match_strdup(args);
3017 if (!p) {
3018 ret = -ENOMEM;
3019 goto out;
3020 }
3021 if (strlen(p) != 32) {
3022 pr_warn("bad dest GID parameter '%s'\n", p);
3023 kfree(p);
3024 goto out;
3025 }
3026
3027 for (i = 0; i < 16; ++i) {
3028 strlcpy(dgid, p + i * 2, sizeof(dgid));
3029 if (sscanf(dgid, "%hhx",
3030 &target->orig_dgid.raw[i]) < 1) {
3031 ret = -EINVAL;
3032 kfree(p);
3033 goto out;
3034 }
3035 }
3036 kfree(p);
3037 break;
3038
3039 case SRP_OPT_PKEY:
3040 if (match_hex(args, &token)) {
3041 pr_warn("bad P_Key parameter '%s'\n", p);
3042 goto out;
3043 }
3044 target->pkey = cpu_to_be16(token);
3045 break;
3046
3047 case SRP_OPT_SERVICE_ID:
3048 p = match_strdup(args);
3049 if (!p) {
3050 ret = -ENOMEM;
3051 goto out;
3052 }
3053 target->service_id = cpu_to_be64(simple_strtoull(p, NULL, 16));
3054 kfree(p);
3055 break;
3056
3057 case SRP_OPT_MAX_SECT:
3058 if (match_int(args, &token)) {
3059 pr_warn("bad max sect parameter '%s'\n", p);
3060 goto out;
3061 }
3062 target->scsi_host->max_sectors = token;
3063 break;
3064
3065 case SRP_OPT_QUEUE_SIZE:
3066 if (match_int(args, &token) || token < 1) {
3067 pr_warn("bad queue_size parameter '%s'\n", p);
3068 goto out;
3069 }
3070 target->scsi_host->can_queue = token;
3071 target->queue_size = token + SRP_RSP_SQ_SIZE +
3072 SRP_TSK_MGMT_SQ_SIZE;
3073 if (!(opt_mask & SRP_OPT_MAX_CMD_PER_LUN))
3074 target->scsi_host->cmd_per_lun = token;
3075 break;
3076
3077 case SRP_OPT_MAX_CMD_PER_LUN:
3078 if (match_int(args, &token) || token < 1) {
3079 pr_warn("bad max cmd_per_lun parameter '%s'\n",
3080 p);
3081 goto out;
3082 }
3083 target->scsi_host->cmd_per_lun = token;
3084 break;
3085
3086 case SRP_OPT_IO_CLASS:
3087 if (match_hex(args, &token)) {
3088 pr_warn("bad IO class parameter '%s'\n", p);
3089 goto out;
3090 }
3091 if (token != SRP_REV10_IB_IO_CLASS &&
3092 token != SRP_REV16A_IB_IO_CLASS) {
3093 pr_warn("unknown IO class parameter value %x specified (use %x or %x).\n",
3094 token, SRP_REV10_IB_IO_CLASS,
3095 SRP_REV16A_IB_IO_CLASS);
3096 goto out;
3097 }
3098 target->io_class = token;
3099 break;
3100
3101 case SRP_OPT_INITIATOR_EXT:
3102 p = match_strdup(args);
3103 if (!p) {
3104 ret = -ENOMEM;
3105 goto out;
3106 }
3107 target->initiator_ext = cpu_to_be64(simple_strtoull(p, NULL, 16));
3108 kfree(p);
3109 break;
3110
3111 case SRP_OPT_CMD_SG_ENTRIES:
3112 if (match_int(args, &token) || token < 1 || token > 255) {
3113 pr_warn("bad max cmd_sg_entries parameter '%s'\n",
3114 p);
3115 goto out;
3116 }
3117 target->cmd_sg_cnt = token;
3118 break;
3119
3120 case SRP_OPT_ALLOW_EXT_SG:
3121 if (match_int(args, &token)) {
3122 pr_warn("bad allow_ext_sg parameter '%s'\n", p);
3123 goto out;
3124 }
3125 target->allow_ext_sg = !!token;
3126 break;
3127
3128 case SRP_OPT_SG_TABLESIZE:
3129 if (match_int(args, &token) || token < 1 ||
3130 token > SCSI_MAX_SG_CHAIN_SEGMENTS) {
3131 pr_warn("bad max sg_tablesize parameter '%s'\n",
3132 p);
3133 goto out;
3134 }
3135 target->sg_tablesize = token;
3136 break;
3137
3138 case SRP_OPT_COMP_VECTOR:
3139 if (match_int(args, &token) || token < 0) {
3140 pr_warn("bad comp_vector parameter '%s'\n", p);
3141 goto out;
3142 }
3143 target->comp_vector = token;
3144 break;
3145
3146 case SRP_OPT_TL_RETRY_COUNT:
3147 if (match_int(args, &token) || token < 2 || token > 7) {
3148 pr_warn("bad tl_retry_count parameter '%s' (must be a number between 2 and 7)\n",
3149 p);
3150 goto out;
3151 }
3152 target->tl_retry_count = token;
3153 break;
3154
3155 default:
3156 pr_warn("unknown parameter or missing value '%s' in target creation request\n",
3157 p);
3158 goto out;
3159 }
3160 }
3161
3162 if ((opt_mask & SRP_OPT_ALL) == SRP_OPT_ALL)
3163 ret = 0;
3164 else
3165 for (i = 0; i < ARRAY_SIZE(srp_opt_tokens); ++i)
3166 if ((srp_opt_tokens[i].token & SRP_OPT_ALL) &&
3167 !(srp_opt_tokens[i].token & opt_mask))
3168 pr_warn("target creation request is missing parameter '%s'\n",
3169 srp_opt_tokens[i].pattern);
3170
3171 if (target->scsi_host->cmd_per_lun > target->scsi_host->can_queue
3172 && (opt_mask & SRP_OPT_MAX_CMD_PER_LUN))
3173 pr_warn("cmd_per_lun = %d > queue_size = %d\n",
3174 target->scsi_host->cmd_per_lun,
3175 target->scsi_host->can_queue);
3176
3177 out:
3178 kfree(options);
3179 return ret;
3180 }
3181
3182 static ssize_t srp_create_target(struct device *dev,
3183 struct device_attribute *attr,
3184 const char *buf, size_t count)
3185 {
3186 struct srp_host *host =
3187 container_of(dev, struct srp_host, dev);
3188 struct Scsi_Host *target_host;
3189 struct srp_target_port *target;
3190 struct srp_rdma_ch *ch;
3191 struct srp_device *srp_dev = host->srp_dev;
3192 struct ib_device *ibdev = srp_dev->dev;
3193 int ret, node_idx, node, cpu, i;
3194 bool multich = false;
3195
3196 target_host = scsi_host_alloc(&srp_template,
3197 sizeof (struct srp_target_port));
3198 if (!target_host)
3199 return -ENOMEM;
3200
3201 target_host->transportt = ib_srp_transport_template;
3202 target_host->max_channel = 0;
3203 target_host->max_id = 1;
3204 target_host->max_lun = -1LL;
3205 target_host->max_cmd_len = sizeof ((struct srp_cmd *) (void *) 0L)->cdb;
3206
3207 target = host_to_target(target_host);
3208
3209 target->io_class = SRP_REV16A_IB_IO_CLASS;
3210 target->scsi_host = target_host;
3211 target->srp_host = host;
3212 target->lkey = host->srp_dev->pd->local_dma_lkey;
3213 target->global_mr = host->srp_dev->global_mr;
3214 target->cmd_sg_cnt = cmd_sg_entries;
3215 target->sg_tablesize = indirect_sg_entries ? : cmd_sg_entries;
3216 target->allow_ext_sg = allow_ext_sg;
3217 target->tl_retry_count = 7;
3218 target->queue_size = SRP_DEFAULT_QUEUE_SIZE;
3219
3220 /*
3221 * Prevent the SCSI host from being removed by srp_remove_target()
3222 * before this function returns.
3223 */
3224 scsi_host_get(target->scsi_host);
3225
3226 mutex_lock(&host->add_target_mutex);
3227
3228 ret = srp_parse_options(buf, target);
3229 if (ret)
3230 goto out;
3231
3232 ret = scsi_init_shared_tag_map(target_host, target_host->can_queue);
3233 if (ret)
3234 goto out;
3235
3236 target->req_ring_size = target->queue_size - SRP_TSK_MGMT_SQ_SIZE;
3237
3238 if (!srp_conn_unique(target->srp_host, target)) {
3239 shost_printk(KERN_INFO, target->scsi_host,
3240 PFX "Already connected to target port with id_ext=%016llx;ioc_guid=%016llx;initiator_ext=%016llx\n",
3241 be64_to_cpu(target->id_ext),
3242 be64_to_cpu(target->ioc_guid),
3243 be64_to_cpu(target->initiator_ext));
3244 ret = -EEXIST;
3245 goto out;
3246 }
3247
3248 if (!srp_dev->has_fmr && !srp_dev->has_fr && !target->allow_ext_sg &&
3249 target->cmd_sg_cnt < target->sg_tablesize) {
3250 pr_warn("No MR pool and no external indirect descriptors, limiting sg_tablesize to cmd_sg_cnt\n");
3251 target->sg_tablesize = target->cmd_sg_cnt;
3252 }
3253
3254 target_host->sg_tablesize = target->sg_tablesize;
3255 target->indirect_size = target->sg_tablesize *
3256 sizeof (struct srp_direct_buf);
3257 target->max_iu_len = sizeof (struct srp_cmd) +
3258 sizeof (struct srp_indirect_buf) +
3259 target->cmd_sg_cnt * sizeof (struct srp_direct_buf);
3260
3261 INIT_WORK(&target->tl_err_work, srp_tl_err_work);
3262 INIT_WORK(&target->remove_work, srp_remove_work);
3263 spin_lock_init(&target->lock);
3264 ret = ib_query_gid(ibdev, host->port, 0, &target->sgid, NULL);
3265 if (ret)
3266 goto out;
3267
3268 ret = -ENOMEM;
3269 target->ch_count = max_t(unsigned, num_online_nodes(),
3270 min(ch_count ? :
3271 min(4 * num_online_nodes(),
3272 ibdev->num_comp_vectors),
3273 num_online_cpus()));
3274 target->ch = kcalloc(target->ch_count, sizeof(*target->ch),
3275 GFP_KERNEL);
3276 if (!target->ch)
3277 goto out;
3278
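/*
 * Spread the RDMA channels evenly over the online NUMA nodes and, within
 * each node, over that node's CPUs and the HCA completion vectors, so that
 * every blk-mq hardware queue gets its own channel and completion vector
 * where possible.
 */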
3279 node_idx = 0;
3280 for_each_online_node(node) {
3281 const int ch_start = (node_idx * target->ch_count /
3282 num_online_nodes());
3283 const int ch_end = ((node_idx + 1) * target->ch_count /
3284 num_online_nodes());
3285 const int cv_start = (node_idx * ibdev->num_comp_vectors /
3286 num_online_nodes() + target->comp_vector)
3287 % ibdev->num_comp_vectors;
3288 const int cv_end = ((node_idx + 1) * ibdev->num_comp_vectors /
3289 num_online_nodes() + target->comp_vector)
3290 % ibdev->num_comp_vectors;
3291 int cpu_idx = 0;
3292
3293 for_each_online_cpu(cpu) {
3294 if (cpu_to_node(cpu) != node)
3295 continue;
3296 if (ch_start + cpu_idx >= ch_end)
3297 continue;
3298 ch = &target->ch[ch_start + cpu_idx];
3299 ch->target = target;
3300 ch->comp_vector = cv_start == cv_end ? cv_start :
3301 cv_start + cpu_idx % (cv_end - cv_start);
3302 spin_lock_init(&ch->lock);
3303 INIT_LIST_HEAD(&ch->free_tx);
3304 ret = srp_new_cm_id(ch);
3305 if (ret)
3306 goto err_disconnect;
3307
3308 ret = srp_create_ch_ib(ch);
3309 if (ret)
3310 goto err_disconnect;
3311
3312 ret = srp_alloc_req_data(ch);
3313 if (ret)
3314 goto err_disconnect;
3315
3316 ret = srp_connect_ch(ch, multich);
3317 if (ret) {
3318 shost_printk(KERN_ERR, target->scsi_host,
3319 PFX "Connection %d/%d failed\n",
3320 ch_start + cpu_idx,
3321 target->ch_count);
3322 if (node_idx == 0 && cpu_idx == 0) {
3323 goto err_disconnect;
3324 } else {
3325 srp_free_ch_ib(target, ch);
3326 srp_free_req_data(target, ch);
3327 target->ch_count = ch - target->ch;
3328 goto connected;
3329 }
3330 }
3331
3332 multich = true;
3333 cpu_idx++;
3334 }
3335 node_idx++;
3336 }
3337
3338 connected:
3339 target->scsi_host->nr_hw_queues = target->ch_count;
3340
3341 ret = srp_add_target(host, target);
3342 if (ret)
3343 goto err_disconnect;
3344
3345 if (target->state != SRP_TARGET_REMOVED) {
3346 shost_printk(KERN_DEBUG, target->scsi_host, PFX
3347 "new target: id_ext %016llx ioc_guid %016llx pkey %04x service_id %016llx sgid %pI6 dgid %pI6\n",
3348 be64_to_cpu(target->id_ext),
3349 be64_to_cpu(target->ioc_guid),
3350 be16_to_cpu(target->pkey),
3351 be64_to_cpu(target->service_id),
3352 target->sgid.raw, target->orig_dgid.raw);
3353 }
3354
3355 ret = count;
3356
3357 out:
3358 mutex_unlock(&host->add_target_mutex);
3359
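/*
 * The first put pairs with the scsi_host_get() earlier in this function;
 * on failure the second put drops the remaining host reference so that the
 * SCSI host gets freed.
 */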
3360 scsi_host_put(target->scsi_host);
3361 if (ret < 0)
3362 scsi_host_put(target->scsi_host);
3363
3364 return ret;
3365
3366 err_disconnect:
3367 srp_disconnect_target(target);
3368
3369 for (i = 0; i < target->ch_count; i++) {
3370 ch = &target->ch[i];
3371 srp_free_ch_ib(target, ch);
3372 srp_free_req_data(target, ch);
3373 }
3374
3375 kfree(target->ch);
3376 goto out;
3377 }
3378
3379 static DEVICE_ATTR(add_target, S_IWUSR, NULL, srp_create_target);
3380
3381 static ssize_t show_ibdev(struct device *dev, struct device_attribute *attr,
3382 char *buf)
3383 {
3384 struct srp_host *host = container_of(dev, struct srp_host, dev);
3385
3386 return sprintf(buf, "%s\n", host->srp_dev->dev->name);
3387 }
3388
3389 static DEVICE_ATTR(ibdev, S_IRUGO, show_ibdev, NULL);
3390
3391 static ssize_t show_port(struct device *dev, struct device_attribute *attr,
3392 char *buf)
3393 {
3394 struct srp_host *host = container_of(dev, struct srp_host, dev);
3395
3396 return sprintf(buf, "%d\n", host->port);
3397 }
3398
3399 static DEVICE_ATTR(port, S_IRUGO, show_port, NULL);
3400
3401 static struct srp_host *srp_add_port(struct srp_device *device, u8 port)
3402 {
3403 struct srp_host *host;
3404
3405 host = kzalloc(sizeof *host, GFP_KERNEL);
3406 if (!host)
3407 return NULL;
3408
3409 INIT_LIST_HEAD(&host->target_list);
3410 spin_lock_init(&host->target_lock);
3411 init_completion(&host->released);
3412 mutex_init(&host->add_target_mutex);
3413 host->srp_dev = device;
3414 host->port = port;
3415
3416 host->dev.class = &srp_class;
3417 host->dev.parent = device->dev->dma_device;
3418 dev_set_name(&host->dev, "srp-%s-%d", device->dev->name, port);
3419
3420 if (device_register(&host->dev))
3421 goto free_host;
3422 if (device_create_file(&host->dev, &dev_attr_add_target))
3423 goto err_class;
3424 if (device_create_file(&host->dev, &dev_attr_ibdev))
3425 goto err_class;
3426 if (device_create_file(&host->dev, &dev_attr_port))
3427 goto err_class;
3428
3429 return host;
3430
3431 err_class:
3432 device_unregister(&host->dev);
3433
3434 free_host:
3435 kfree(host);
3436
3437 return NULL;
3438 }
3439
3440 static void srp_add_one(struct ib_device *device)
3441 {
3442 struct srp_device *srp_dev;
3443 struct ib_device_attr *dev_attr;
3444 struct srp_host *host;
3445 int mr_page_shift, p;
3446 u64 max_pages_per_mr;
3447
3448 dev_attr = kmalloc(sizeof *dev_attr, GFP_KERNEL);
3449 if (!dev_attr)
3450 return;
3451
3452 if (ib_query_device(device, dev_attr)) {
3453 pr_warn("Query device failed for %s\n", device->name);
3454 goto free_attr;
3455 }
3456
3457 srp_dev = kmalloc(sizeof *srp_dev, GFP_KERNEL);
3458 if (!srp_dev)
3459 goto free_attr;
3460
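/*
 * Determine which memory registration scheme to use: fast registration (FR)
 * is preferred over FMR when both are supported and the prefer_fr module
 * parameter is set.
 */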
3461 srp_dev->has_fmr = (device->alloc_fmr && device->dealloc_fmr &&
3462 device->map_phys_fmr && device->unmap_fmr);
3463 srp_dev->has_fr = (dev_attr->device_cap_flags &
3464 IB_DEVICE_MEM_MGT_EXTENSIONS);
3465 if (!srp_dev->has_fmr && !srp_dev->has_fr)
3466 dev_warn(&device->dev, "neither FMR nor FR is supported\n");
3467
3468 srp_dev->use_fast_reg = (srp_dev->has_fr &&
3469 (!srp_dev->has_fmr || prefer_fr));
3470 srp_dev->use_fmr = !srp_dev->use_fast_reg && srp_dev->has_fmr;
3471
3472 /*
3473 * Use the smallest page size supported by the HCA, down to a
3474 * minimum of 4096 bytes. We're unlikely to build large sglists
3475 * out of smaller entries.
3476 */
3477 mr_page_shift = max(12, ffs(dev_attr->page_size_cap) - 1);
3478 srp_dev->mr_page_size = 1 << mr_page_shift;
3479 srp_dev->mr_page_mask = ~((u64) srp_dev->mr_page_size - 1);
3480 max_pages_per_mr = dev_attr->max_mr_size;
3481 do_div(max_pages_per_mr, srp_dev->mr_page_size);
3482 srp_dev->max_pages_per_mr = min_t(u64, SRP_MAX_PAGES_PER_MR,
3483 max_pages_per_mr);
3484 if (srp_dev->use_fast_reg) {
3485 srp_dev->max_pages_per_mr =
3486 min_t(u32, srp_dev->max_pages_per_mr,
3487 dev_attr->max_fast_reg_page_list_len);
3488 }
3489 srp_dev->mr_max_size = srp_dev->mr_page_size *
3490 srp_dev->max_pages_per_mr;
3491 pr_debug("%s: mr_page_shift = %d, dev_attr->max_mr_size = %#llx, dev_attr->max_fast_reg_page_list_len = %u, max_pages_per_mr = %d, mr_max_size = %#x\n",
3492 device->name, mr_page_shift, dev_attr->max_mr_size,
3493 dev_attr->max_fast_reg_page_list_len,
3494 srp_dev->max_pages_per_mr, srp_dev->mr_max_size);
3495
3496 INIT_LIST_HEAD(&srp_dev->dev_list);
3497
3498 srp_dev->dev = device;
3499 srp_dev->pd = ib_alloc_pd(device);
3500 if (IS_ERR(srp_dev->pd))
3501 goto free_dev;
3502
3503 if (!register_always || (!srp_dev->has_fmr && !srp_dev->has_fr)) {
3504 srp_dev->global_mr = ib_get_dma_mr(srp_dev->pd,
3505 IB_ACCESS_LOCAL_WRITE |
3506 IB_ACCESS_REMOTE_READ |
3507 IB_ACCESS_REMOTE_WRITE);
3508 if (IS_ERR(srp_dev->global_mr))
3509 goto err_pd;
3510 } else {
3511 srp_dev->global_mr = NULL;
3512 }
3513
3514 for (p = rdma_start_port(device); p <= rdma_end_port(device); ++p) {
3515 host = srp_add_port(srp_dev, p);
3516 if (host)
3517 list_add_tail(&host->list, &srp_dev->dev_list);
3518 }
3519
3520 ib_set_client_data(device, &srp_client, srp_dev);
3521
3522 goto free_attr;
3523
3524 err_pd:
3525 ib_dealloc_pd(srp_dev->pd);
3526
3527 free_dev:
3528 kfree(srp_dev);
3529
3530 free_attr:
3531 kfree(dev_attr);
3532 }
3533
3534 static void srp_remove_one(struct ib_device *device, void *client_data)
3535 {
3536 struct srp_device *srp_dev;
3537 struct srp_host *host, *tmp_host;
3538 struct srp_target_port *target;
3539
3540 srp_dev = client_data;
3541 if (!srp_dev)
3542 return;
3543
3544 list_for_each_entry_safe(host, tmp_host, &srp_dev->dev_list, list) {
3545 device_unregister(&host->dev);
3546 /*
3547 * Wait for the sysfs entry to go away, so that no new
3548 * target ports can be created.
3549 */
3550 wait_for_completion(&host->released);
3551
3552 /*
3553 * Remove all target ports.
3554 */
3555 spin_lock(&host->target_lock);
3556 list_for_each_entry(target, &host->target_list, list)
3557 srp_queue_remove_work(target);
3558 spin_unlock(&host->target_lock);
3559
3560 /*
3561 * Wait for tl_err and target port removal tasks.
3562 */
3563 flush_workqueue(system_long_wq);
3564 flush_workqueue(srp_remove_wq);
3565
3566 kfree(host);
3567 }
3568
3569 if (srp_dev->global_mr)
3570 ib_dereg_mr(srp_dev->global_mr);
3571 ib_dealloc_pd(srp_dev->pd);
3572
3573 kfree(srp_dev);
3574 }
3575
3576 static struct srp_function_template ib_srp_transport_functions = {
3577 .has_rport_state = true,
3578 .reset_timer_if_blocked = true,
3579 .reconnect_delay = &srp_reconnect_delay,
3580 .fast_io_fail_tmo = &srp_fast_io_fail_tmo,
3581 .dev_loss_tmo = &srp_dev_loss_tmo,
3582 .reconnect = srp_rport_reconnect,
3583 .rport_delete = srp_rport_delete,
3584 .terminate_rport_io = srp_terminate_io,
3585 };
3586
3587 static int __init srp_init_module(void)
3588 {
3589 int ret;
3590
3591 BUILD_BUG_ON(FIELD_SIZEOF(struct ib_wc, wr_id) < sizeof(void *));
3592
3593 if (srp_sg_tablesize) {
3594 pr_warn("srp_sg_tablesize is deprecated, please use cmd_sg_entries\n");
3595 if (!cmd_sg_entries)
3596 cmd_sg_entries = srp_sg_tablesize;
3597 }
3598
3599 if (!cmd_sg_entries)
3600 cmd_sg_entries = SRP_DEF_SG_TABLESIZE;
3601
3602 if (cmd_sg_entries > 255) {
3603 pr_warn("Clamping cmd_sg_entries to 255\n");
3604 cmd_sg_entries = 255;
3605 }
3606
3607 if (!indirect_sg_entries)
3608 indirect_sg_entries = cmd_sg_entries;
3609 else if (indirect_sg_entries < cmd_sg_entries) {
3610 pr_warn("Bumping up indirect_sg_entries to match cmd_sg_entries (%u)\n",
3611 cmd_sg_entries);
3612 indirect_sg_entries = cmd_sg_entries;
3613 }
3614
3615 srp_remove_wq = create_workqueue("srp_remove");
3616 if (!srp_remove_wq) {
3617 ret = -ENOMEM;
3618 goto out;
3619 }
3620
3621 ret = -ENOMEM;
3622 ib_srp_transport_template =
3623 srp_attach_transport(&ib_srp_transport_functions);
3624 if (!ib_srp_transport_template)
3625 goto destroy_wq;
3626
3627 ret = class_register(&srp_class);
3628 if (ret) {
3629 pr_err("couldn't register class infiniband_srp\n");
3630 goto release_tr;
3631 }
3632
3633 ib_sa_register_client(&srp_sa_client);
3634
3635 ret = ib_register_client(&srp_client);
3636 if (ret) {
3637 pr_err("couldn't register IB client\n");
3638 goto unreg_sa;
3639 }
3640
3641 out:
3642 return ret;
3643
3644 unreg_sa:
3645 ib_sa_unregister_client(&srp_sa_client);
3646 class_unregister(&srp_class);
3647
3648 release_tr:
3649 srp_release_transport(ib_srp_transport_template);
3650
3651 destroy_wq:
3652 destroy_workqueue(srp_remove_wq);
3653 goto out;
3654 }
3655
3656 static void __exit srp_cleanup_module(void)
3657 {
3658 ib_unregister_client(&srp_client);
3659 ib_sa_unregister_client(&srp_sa_client);
3660 class_unregister(&srp_class);
3661 srp_release_transport(ib_srp_transport_template);
3662 destroy_workqueue(srp_remove_wq);
3663 }
3664
3665 module_init(srp_init_module);
3666 module_exit(srp_cleanup_module);