Merge tag 'v4.2-rc8' into x86/mm, before applying new changes
[deliverable/linux.git] / drivers / scsi / cxgbi / libcxgbi.c
1 /*
2 * libcxgbi.c: Chelsio common library for T3/T4 iSCSI driver.
3 *
4 * Copyright (c) 2010-2015 Chelsio Communications, Inc.
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation.
9 *
10 * Written by: Karen Xie (kxie@chelsio.com)
11 * Written by: Rakesh Ranjan (rranjan@chelsio.com)
12 */
13
14 #define pr_fmt(fmt) KBUILD_MODNAME ":%s: " fmt, __func__
15
16 #include <linux/skbuff.h>
17 #include <linux/crypto.h>
18 #include <linux/scatterlist.h>
19 #include <linux/pci.h>
20 #include <scsi/scsi.h>
21 #include <scsi/scsi_cmnd.h>
22 #include <scsi/scsi_host.h>
23 #include <linux/if_vlan.h>
24 #include <linux/inet.h>
25 #include <net/dst.h>
26 #include <net/route.h>
27 #include <net/ipv6.h>
28 #include <net/ip6_route.h>
29 #include <net/addrconf.h>
30
31 #include <linux/inetdevice.h> /* ip_dev_find */
32 #include <linux/module.h>
33 #include <net/tcp.h>
34
35 static unsigned int dbg_level;
36
37 #include "libcxgbi.h"
38
39 #define DRV_MODULE_NAME "libcxgbi"
40 #define DRV_MODULE_DESC "Chelsio iSCSI driver library"
41 #define DRV_MODULE_VERSION "0.9.1-ko"
42 #define DRV_MODULE_RELDATE "Apr. 2015"
43
44 static char version[] =
45 DRV_MODULE_DESC " " DRV_MODULE_NAME
46 " v" DRV_MODULE_VERSION " (" DRV_MODULE_RELDATE ")\n";
47
48 MODULE_AUTHOR("Chelsio Communications, Inc.");
49 MODULE_DESCRIPTION(DRV_MODULE_DESC);
50 MODULE_VERSION(DRV_MODULE_VERSION);
51 MODULE_LICENSE("GPL");
52
53 module_param(dbg_level, uint, 0644);
54 MODULE_PARM_DESC(dbg_level, "libiscsi debug level (default=0)");
55
56
57 /*
58 * cxgbi device management
59 * maintains a list of the cxgbi devices
60 */
61 static LIST_HEAD(cdev_list);
62 static DEFINE_MUTEX(cdev_mutex);
63
64 static LIST_HEAD(cdev_rcu_list);
65 static DEFINE_SPINLOCK(cdev_rcu_lock);
66
67 int cxgbi_device_portmap_create(struct cxgbi_device *cdev, unsigned int base,
68 unsigned int max_conn)
69 {
70 struct cxgbi_ports_map *pmap = &cdev->pmap;
71
72 pmap->port_csk = cxgbi_alloc_big_mem(max_conn *
73 sizeof(struct cxgbi_sock *),
74 GFP_KERNEL);
75 if (!pmap->port_csk) {
76 pr_warn("cdev 0x%p, portmap OOM %u.\n", cdev, max_conn);
77 return -ENOMEM;
78 }
79
80 pmap->max_connect = max_conn;
81 pmap->sport_base = base;
82 spin_lock_init(&pmap->lock);
83 return 0;
84 }
85 EXPORT_SYMBOL_GPL(cxgbi_device_portmap_create);
86
87 void cxgbi_device_portmap_cleanup(struct cxgbi_device *cdev)
88 {
89 struct cxgbi_ports_map *pmap = &cdev->pmap;
90 struct cxgbi_sock *csk;
91 int i;
92
93 for (i = 0; i < pmap->max_connect; i++) {
94 if (pmap->port_csk[i]) {
95 csk = pmap->port_csk[i];
96 pmap->port_csk[i] = NULL;
97 log_debug(1 << CXGBI_DBG_SOCK,
98 "csk 0x%p, cdev 0x%p, offload down.\n",
99 csk, cdev);
100 spin_lock_bh(&csk->lock);
101 cxgbi_sock_set_flag(csk, CTPF_OFFLOAD_DOWN);
102 cxgbi_sock_closed(csk);
103 spin_unlock_bh(&csk->lock);
104 cxgbi_sock_put(csk);
105 }
106 }
107 }
108 EXPORT_SYMBOL_GPL(cxgbi_device_portmap_cleanup);
109
110 static inline void cxgbi_device_destroy(struct cxgbi_device *cdev)
111 {
112 log_debug(1 << CXGBI_DBG_DEV,
113 "cdev 0x%p, p# %u.\n", cdev, cdev->nports);
114 cxgbi_hbas_remove(cdev);
115 cxgbi_device_portmap_cleanup(cdev);
116 if (cdev->dev_ddp_cleanup)
117 cdev->dev_ddp_cleanup(cdev);
118 else
119 cxgbi_ddp_cleanup(cdev);
120 if (cdev->ddp)
121 cxgbi_ddp_cleanup(cdev);
122 if (cdev->pmap.max_connect)
123 cxgbi_free_big_mem(cdev->pmap.port_csk);
124 kfree(cdev);
125 }
126
127 struct cxgbi_device *cxgbi_device_register(unsigned int extra,
128 unsigned int nports)
129 {
130 struct cxgbi_device *cdev;
131
132 cdev = kzalloc(sizeof(*cdev) + extra + nports *
133 (sizeof(struct cxgbi_hba *) +
134 sizeof(struct net_device *)),
135 GFP_KERNEL);
136 if (!cdev) {
137 pr_warn("nport %d, OOM.\n", nports);
138 return NULL;
139 }
140 cdev->ports = (struct net_device **)(cdev + 1);
141 cdev->hbas = (struct cxgbi_hba **)(((char*)cdev->ports) + nports *
142 sizeof(struct net_device *));
143 if (extra)
144 cdev->dd_data = ((char *)cdev->hbas) +
145 nports * sizeof(struct cxgbi_hba *);
146 spin_lock_init(&cdev->pmap.lock);
147
148 mutex_lock(&cdev_mutex);
149 list_add_tail(&cdev->list_head, &cdev_list);
150 mutex_unlock(&cdev_mutex);
151
152 spin_lock(&cdev_rcu_lock);
153 list_add_tail_rcu(&cdev->rcu_node, &cdev_rcu_list);
154 spin_unlock(&cdev_rcu_lock);
155
156 log_debug(1 << CXGBI_DBG_DEV,
157 "cdev 0x%p, p# %u.\n", cdev, nports);
158 return cdev;
159 }
160 EXPORT_SYMBOL_GPL(cxgbi_device_register);
161
162 void cxgbi_device_unregister(struct cxgbi_device *cdev)
163 {
164 log_debug(1 << CXGBI_DBG_DEV,
165 "cdev 0x%p, p# %u,%s.\n",
166 cdev, cdev->nports, cdev->nports ? cdev->ports[0]->name : "");
167
168 mutex_lock(&cdev_mutex);
169 list_del(&cdev->list_head);
170 mutex_unlock(&cdev_mutex);
171
172 spin_lock(&cdev_rcu_lock);
173 list_del_rcu(&cdev->rcu_node);
174 spin_unlock(&cdev_rcu_lock);
175 synchronize_rcu();
176
177 cxgbi_device_destroy(cdev);
178 }
179 EXPORT_SYMBOL_GPL(cxgbi_device_unregister);
180
181 void cxgbi_device_unregister_all(unsigned int flag)
182 {
183 struct cxgbi_device *cdev, *tmp;
184
185 mutex_lock(&cdev_mutex);
186 list_for_each_entry_safe(cdev, tmp, &cdev_list, list_head) {
187 if ((cdev->flags & flag) == flag) {
188 mutex_unlock(&cdev_mutex);
189 cxgbi_device_unregister(cdev);
190 mutex_lock(&cdev_mutex);
191 }
192 }
193 mutex_unlock(&cdev_mutex);
194 }
195 EXPORT_SYMBOL_GPL(cxgbi_device_unregister_all);
196
197 struct cxgbi_device *cxgbi_device_find_by_lldev(void *lldev)
198 {
199 struct cxgbi_device *cdev, *tmp;
200
201 mutex_lock(&cdev_mutex);
202 list_for_each_entry_safe(cdev, tmp, &cdev_list, list_head) {
203 if (cdev->lldev == lldev) {
204 mutex_unlock(&cdev_mutex);
205 return cdev;
206 }
207 }
208 mutex_unlock(&cdev_mutex);
209
210 log_debug(1 << CXGBI_DBG_DEV,
211 "lldev 0x%p, NO match found.\n", lldev);
212 return NULL;
213 }
214 EXPORT_SYMBOL_GPL(cxgbi_device_find_by_lldev);
215
216 struct cxgbi_device *cxgbi_device_find_by_netdev(struct net_device *ndev,
217 int *port)
218 {
219 struct net_device *vdev = NULL;
220 struct cxgbi_device *cdev, *tmp;
221 int i;
222
223 if (ndev->priv_flags & IFF_802_1Q_VLAN) {
224 vdev = ndev;
225 ndev = vlan_dev_real_dev(ndev);
226 log_debug(1 << CXGBI_DBG_DEV,
227 "vlan dev %s -> %s.\n", vdev->name, ndev->name);
228 }
229
230 mutex_lock(&cdev_mutex);
231 list_for_each_entry_safe(cdev, tmp, &cdev_list, list_head) {
232 for (i = 0; i < cdev->nports; i++) {
233 if (ndev == cdev->ports[i]) {
234 cdev->hbas[i]->vdev = vdev;
235 mutex_unlock(&cdev_mutex);
236 if (port)
237 *port = i;
238 return cdev;
239 }
240 }
241 }
242 mutex_unlock(&cdev_mutex);
243 log_debug(1 << CXGBI_DBG_DEV,
244 "ndev 0x%p, %s, NO match found.\n", ndev, ndev->name);
245 return NULL;
246 }
247 EXPORT_SYMBOL_GPL(cxgbi_device_find_by_netdev);
248
249 struct cxgbi_device *cxgbi_device_find_by_netdev_rcu(struct net_device *ndev,
250 int *port)
251 {
252 struct net_device *vdev = NULL;
253 struct cxgbi_device *cdev;
254 int i;
255
256 if (ndev->priv_flags & IFF_802_1Q_VLAN) {
257 vdev = ndev;
258 ndev = vlan_dev_real_dev(ndev);
259 pr_info("vlan dev %s -> %s.\n", vdev->name, ndev->name);
260 }
261
262 rcu_read_lock();
263 list_for_each_entry_rcu(cdev, &cdev_rcu_list, rcu_node) {
264 for (i = 0; i < cdev->nports; i++) {
265 if (ndev == cdev->ports[i]) {
266 cdev->hbas[i]->vdev = vdev;
267 rcu_read_unlock();
268 if (port)
269 *port = i;
270 return cdev;
271 }
272 }
273 }
274 rcu_read_unlock();
275
276 log_debug(1 << CXGBI_DBG_DEV,
277 "ndev 0x%p, %s, NO match found.\n", ndev, ndev->name);
278 return NULL;
279 }
280 EXPORT_SYMBOL_GPL(cxgbi_device_find_by_netdev_rcu);
281
282 #if IS_ENABLED(CONFIG_IPV6)
283 static struct cxgbi_device *cxgbi_device_find_by_mac(struct net_device *ndev,
284 int *port)
285 {
286 struct net_device *vdev = NULL;
287 struct cxgbi_device *cdev, *tmp;
288 int i;
289
290 if (ndev->priv_flags & IFF_802_1Q_VLAN) {
291 vdev = ndev;
292 ndev = vlan_dev_real_dev(ndev);
293 pr_info("vlan dev %s -> %s.\n", vdev->name, ndev->name);
294 }
295
296 mutex_lock(&cdev_mutex);
297 list_for_each_entry_safe(cdev, tmp, &cdev_list, list_head) {
298 for (i = 0; i < cdev->nports; i++) {
299 if (!memcmp(ndev->dev_addr, cdev->ports[i]->dev_addr,
300 MAX_ADDR_LEN)) {
301 cdev->hbas[i]->vdev = vdev;
302 mutex_unlock(&cdev_mutex);
303 if (port)
304 *port = i;
305 return cdev;
306 }
307 }
308 }
309 mutex_unlock(&cdev_mutex);
310 log_debug(1 << CXGBI_DBG_DEV,
311 "ndev 0x%p, %s, NO match mac found.\n",
312 ndev, ndev->name);
313 return NULL;
314 }
315 #endif
316
317 void cxgbi_hbas_remove(struct cxgbi_device *cdev)
318 {
319 int i;
320 struct cxgbi_hba *chba;
321
322 log_debug(1 << CXGBI_DBG_DEV,
323 "cdev 0x%p, p#%u.\n", cdev, cdev->nports);
324
325 for (i = 0; i < cdev->nports; i++) {
326 chba = cdev->hbas[i];
327 if (chba) {
328 cdev->hbas[i] = NULL;
329 iscsi_host_remove(chba->shost);
330 pci_dev_put(cdev->pdev);
331 iscsi_host_free(chba->shost);
332 }
333 }
334 }
335 EXPORT_SYMBOL_GPL(cxgbi_hbas_remove);
336
337 int cxgbi_hbas_add(struct cxgbi_device *cdev, u64 max_lun,
338 unsigned int max_id, struct scsi_host_template *sht,
339 struct scsi_transport_template *stt)
340 {
341 struct cxgbi_hba *chba;
342 struct Scsi_Host *shost;
343 int i, err;
344
345 log_debug(1 << CXGBI_DBG_DEV, "cdev 0x%p, p#%u.\n", cdev, cdev->nports);
346
347 for (i = 0; i < cdev->nports; i++) {
348 shost = iscsi_host_alloc(sht, sizeof(*chba), 1);
349 if (!shost) {
350 pr_info("0x%p, p%d, %s, host alloc failed.\n",
351 cdev, i, cdev->ports[i]->name);
352 err = -ENOMEM;
353 goto err_out;
354 }
355
356 shost->transportt = stt;
357 shost->max_lun = max_lun;
358 shost->max_id = max_id;
359 shost->max_channel = 0;
360 shost->max_cmd_len = 16;
361
362 chba = iscsi_host_priv(shost);
363 chba->cdev = cdev;
364 chba->ndev = cdev->ports[i];
365 chba->shost = shost;
366
367 log_debug(1 << CXGBI_DBG_DEV,
368 "cdev 0x%p, p#%d %s: chba 0x%p.\n",
369 cdev, i, cdev->ports[i]->name, chba);
370
371 pci_dev_get(cdev->pdev);
372 err = iscsi_host_add(shost, &cdev->pdev->dev);
373 if (err) {
374 pr_info("cdev 0x%p, p#%d %s, host add failed.\n",
375 cdev, i, cdev->ports[i]->name);
376 pci_dev_put(cdev->pdev);
377 scsi_host_put(shost);
378 goto err_out;
379 }
380
381 cdev->hbas[i] = chba;
382 }
383
384 return 0;
385
386 err_out:
387 cxgbi_hbas_remove(cdev);
388 return err;
389 }
390 EXPORT_SYMBOL_GPL(cxgbi_hbas_add);
391
392 /*
393 * iSCSI offload
394 *
395 * - source port management
396 * To find a free source port in the port allocation map we use a very simple
397 * rotor scheme to look for the next free port.
398 *
399 * If a source port has been specified make sure that it doesn't collide with
400 * our normal source port allocation map. If it's outside the range of our
401 * allocation/deallocation scheme just let them use it.
402 *
403 * If the source port is outside our allocation range, the caller is
404 * responsible for keeping track of their port usage.
405 */
406
407 static struct cxgbi_sock *find_sock_on_port(struct cxgbi_device *cdev,
408 unsigned char port_id)
409 {
410 struct cxgbi_ports_map *pmap = &cdev->pmap;
411 unsigned int i;
412 unsigned int used;
413
414 if (!pmap->max_connect || !pmap->used)
415 return NULL;
416
417 spin_lock_bh(&pmap->lock);
418 used = pmap->used;
419 for (i = 0; used && i < pmap->max_connect; i++) {
420 struct cxgbi_sock *csk = pmap->port_csk[i];
421
422 if (csk) {
423 if (csk->port_id == port_id) {
424 spin_unlock_bh(&pmap->lock);
425 return csk;
426 }
427 used--;
428 }
429 }
430 spin_unlock_bh(&pmap->lock);
431
432 return NULL;
433 }
434
435 static int sock_get_port(struct cxgbi_sock *csk)
436 {
437 struct cxgbi_device *cdev = csk->cdev;
438 struct cxgbi_ports_map *pmap = &cdev->pmap;
439 unsigned int start;
440 int idx;
441 __be16 *port;
442
443 if (!pmap->max_connect) {
444 pr_err("cdev 0x%p, p#%u %s, NO port map.\n",
445 cdev, csk->port_id, cdev->ports[csk->port_id]->name);
446 return -EADDRNOTAVAIL;
447 }
448
449 if (csk->csk_family == AF_INET)
450 port = &csk->saddr.sin_port;
451 else /* ipv6 */
452 port = &csk->saddr6.sin6_port;
453
454 if (*port) {
455 pr_err("source port NON-ZERO %u.\n",
456 ntohs(*port));
457 return -EADDRINUSE;
458 }
459
460 spin_lock_bh(&pmap->lock);
461 if (pmap->used >= pmap->max_connect) {
462 spin_unlock_bh(&pmap->lock);
463 pr_info("cdev 0x%p, p#%u %s, ALL ports used.\n",
464 cdev, csk->port_id, cdev->ports[csk->port_id]->name);
465 return -EADDRNOTAVAIL;
466 }
467
468 start = idx = pmap->next;
469 do {
470 if (++idx >= pmap->max_connect)
471 idx = 0;
472 if (!pmap->port_csk[idx]) {
473 pmap->used++;
474 *port = htons(pmap->sport_base + idx);
475 pmap->next = idx;
476 pmap->port_csk[idx] = csk;
477 spin_unlock_bh(&pmap->lock);
478 cxgbi_sock_get(csk);
479 log_debug(1 << CXGBI_DBG_SOCK,
480 "cdev 0x%p, p#%u %s, p %u, %u.\n",
481 cdev, csk->port_id,
482 cdev->ports[csk->port_id]->name,
483 pmap->sport_base + idx, pmap->next);
484 return 0;
485 }
486 } while (idx != start);
487 spin_unlock_bh(&pmap->lock);
488
489 /* should not happen */
490 pr_warn("cdev 0x%p, p#%u %s, next %u?\n",
491 cdev, csk->port_id, cdev->ports[csk->port_id]->name,
492 pmap->next);
493 return -EADDRNOTAVAIL;
494 }
495
496 static void sock_put_port(struct cxgbi_sock *csk)
497 {
498 struct cxgbi_device *cdev = csk->cdev;
499 struct cxgbi_ports_map *pmap = &cdev->pmap;
500 __be16 *port;
501
502 if (csk->csk_family == AF_INET)
503 port = &csk->saddr.sin_port;
504 else /* ipv6 */
505 port = &csk->saddr6.sin6_port;
506
507 if (*port) {
508 int idx = ntohs(*port) - pmap->sport_base;
509
510 *port = 0;
511 if (idx < 0 || idx >= pmap->max_connect) {
512 pr_err("cdev 0x%p, p#%u %s, port %u OOR.\n",
513 cdev, csk->port_id,
514 cdev->ports[csk->port_id]->name,
515 ntohs(*port));
516 return;
517 }
518
519 spin_lock_bh(&pmap->lock);
520 pmap->port_csk[idx] = NULL;
521 pmap->used--;
522 spin_unlock_bh(&pmap->lock);
523
524 log_debug(1 << CXGBI_DBG_SOCK,
525 "cdev 0x%p, p#%u %s, release %u.\n",
526 cdev, csk->port_id, cdev->ports[csk->port_id]->name,
527 pmap->sport_base + idx);
528
529 cxgbi_sock_put(csk);
530 }
531 }
532
533 /*
534 * iscsi tcp connection
535 */
536 void cxgbi_sock_free_cpl_skbs(struct cxgbi_sock *csk)
537 {
538 if (csk->cpl_close) {
539 kfree_skb(csk->cpl_close);
540 csk->cpl_close = NULL;
541 }
542 if (csk->cpl_abort_req) {
543 kfree_skb(csk->cpl_abort_req);
544 csk->cpl_abort_req = NULL;
545 }
546 if (csk->cpl_abort_rpl) {
547 kfree_skb(csk->cpl_abort_rpl);
548 csk->cpl_abort_rpl = NULL;
549 }
550 }
551 EXPORT_SYMBOL_GPL(cxgbi_sock_free_cpl_skbs);
552
553 static struct cxgbi_sock *cxgbi_sock_create(struct cxgbi_device *cdev)
554 {
555 struct cxgbi_sock *csk = kzalloc(sizeof(*csk), GFP_NOIO);
556
557 if (!csk) {
558 pr_info("alloc csk %zu failed.\n", sizeof(*csk));
559 return NULL;
560 }
561
562 if (cdev->csk_alloc_cpls(csk) < 0) {
563 pr_info("csk 0x%p, alloc cpls failed.\n", csk);
564 kfree(csk);
565 return NULL;
566 }
567
568 spin_lock_init(&csk->lock);
569 kref_init(&csk->refcnt);
570 skb_queue_head_init(&csk->receive_queue);
571 skb_queue_head_init(&csk->write_queue);
572 setup_timer(&csk->retry_timer, NULL, (unsigned long)csk);
573 rwlock_init(&csk->callback_lock);
574 csk->cdev = cdev;
575 csk->flags = 0;
576 cxgbi_sock_set_state(csk, CTP_CLOSED);
577
578 log_debug(1 << CXGBI_DBG_SOCK, "cdev 0x%p, new csk 0x%p.\n", cdev, csk);
579
580 return csk;
581 }
582
583 static struct rtable *find_route_ipv4(struct flowi4 *fl4,
584 __be32 saddr, __be32 daddr,
585 __be16 sport, __be16 dport, u8 tos)
586 {
587 struct rtable *rt;
588
589 rt = ip_route_output_ports(&init_net, fl4, NULL, daddr, saddr,
590 dport, sport, IPPROTO_TCP, tos, 0);
591 if (IS_ERR(rt))
592 return NULL;
593
594 return rt;
595 }
596
597 static struct cxgbi_sock *cxgbi_check_route(struct sockaddr *dst_addr)
598 {
599 struct sockaddr_in *daddr = (struct sockaddr_in *)dst_addr;
600 struct dst_entry *dst;
601 struct net_device *ndev;
602 struct cxgbi_device *cdev;
603 struct rtable *rt = NULL;
604 struct neighbour *n;
605 struct flowi4 fl4;
606 struct cxgbi_sock *csk = NULL;
607 unsigned int mtu = 0;
608 int port = 0xFFFF;
609 int err = 0;
610
611 rt = find_route_ipv4(&fl4, 0, daddr->sin_addr.s_addr, 0, daddr->sin_port, 0);
612 if (!rt) {
613 pr_info("no route to ipv4 0x%x, port %u.\n",
614 be32_to_cpu(daddr->sin_addr.s_addr),
615 be16_to_cpu(daddr->sin_port));
616 err = -ENETUNREACH;
617 goto err_out;
618 }
619 dst = &rt->dst;
620 n = dst_neigh_lookup(dst, &daddr->sin_addr.s_addr);
621 if (!n) {
622 err = -ENODEV;
623 goto rel_rt;
624 }
625 ndev = n->dev;
626
627 if (rt->rt_flags & (RTCF_MULTICAST | RTCF_BROADCAST)) {
628 pr_info("multi-cast route %pI4, port %u, dev %s.\n",
629 &daddr->sin_addr.s_addr, ntohs(daddr->sin_port),
630 ndev->name);
631 err = -ENETUNREACH;
632 goto rel_neigh;
633 }
634
635 if (ndev->flags & IFF_LOOPBACK) {
636 ndev = ip_dev_find(&init_net, daddr->sin_addr.s_addr);
637 mtu = ndev->mtu;
638 pr_info("rt dev %s, loopback -> %s, mtu %u.\n",
639 n->dev->name, ndev->name, mtu);
640 }
641
642 cdev = cxgbi_device_find_by_netdev(ndev, &port);
643 if (!cdev) {
644 pr_info("dst %pI4, %s, NOT cxgbi device.\n",
645 &daddr->sin_addr.s_addr, ndev->name);
646 err = -ENETUNREACH;
647 goto rel_neigh;
648 }
649 log_debug(1 << CXGBI_DBG_SOCK,
650 "route to %pI4 :%u, ndev p#%d,%s, cdev 0x%p.\n",
651 &daddr->sin_addr.s_addr, ntohs(daddr->sin_port),
652 port, ndev->name, cdev);
653
654 csk = cxgbi_sock_create(cdev);
655 if (!csk) {
656 err = -ENOMEM;
657 goto rel_neigh;
658 }
659 csk->cdev = cdev;
660 csk->port_id = port;
661 csk->mtu = mtu;
662 csk->dst = dst;
663
664 csk->csk_family = AF_INET;
665 csk->daddr.sin_addr.s_addr = daddr->sin_addr.s_addr;
666 csk->daddr.sin_port = daddr->sin_port;
667 csk->daddr.sin_family = daddr->sin_family;
668 csk->saddr.sin_family = daddr->sin_family;
669 csk->saddr.sin_addr.s_addr = fl4.saddr;
670 neigh_release(n);
671
672 return csk;
673
674 rel_neigh:
675 neigh_release(n);
676
677 rel_rt:
678 ip_rt_put(rt);
679 if (csk)
680 cxgbi_sock_closed(csk);
681 err_out:
682 return ERR_PTR(err);
683 }
684
685 #if IS_ENABLED(CONFIG_IPV6)
686 static struct rt6_info *find_route_ipv6(const struct in6_addr *saddr,
687 const struct in6_addr *daddr)
688 {
689 struct flowi6 fl;
690
691 if (saddr)
692 memcpy(&fl.saddr, saddr, sizeof(struct in6_addr));
693 if (daddr)
694 memcpy(&fl.daddr, daddr, sizeof(struct in6_addr));
695 return (struct rt6_info *)ip6_route_output(&init_net, NULL, &fl);
696 }
697
698 static struct cxgbi_sock *cxgbi_check_route6(struct sockaddr *dst_addr)
699 {
700 struct sockaddr_in6 *daddr6 = (struct sockaddr_in6 *)dst_addr;
701 struct dst_entry *dst;
702 struct net_device *ndev;
703 struct cxgbi_device *cdev;
704 struct rt6_info *rt = NULL;
705 struct neighbour *n;
706 struct in6_addr pref_saddr;
707 struct cxgbi_sock *csk = NULL;
708 unsigned int mtu = 0;
709 int port = 0xFFFF;
710 int err = 0;
711
712 rt = find_route_ipv6(NULL, &daddr6->sin6_addr);
713
714 if (!rt) {
715 pr_info("no route to ipv6 %pI6 port %u\n",
716 daddr6->sin6_addr.s6_addr,
717 be16_to_cpu(daddr6->sin6_port));
718 err = -ENETUNREACH;
719 goto err_out;
720 }
721
722 dst = &rt->dst;
723
724 n = dst_neigh_lookup(dst, &daddr6->sin6_addr);
725
726 if (!n) {
727 pr_info("%pI6, port %u, dst no neighbour.\n",
728 daddr6->sin6_addr.s6_addr,
729 be16_to_cpu(daddr6->sin6_port));
730 err = -ENETUNREACH;
731 goto rel_rt;
732 }
733 ndev = n->dev;
734
735 if (ipv6_addr_is_multicast(&daddr6->sin6_addr)) {
736 pr_info("multi-cast route %pI6 port %u, dev %s.\n",
737 daddr6->sin6_addr.s6_addr,
738 ntohs(daddr6->sin6_port), ndev->name);
739 err = -ENETUNREACH;
740 goto rel_rt;
741 }
742
743 cdev = cxgbi_device_find_by_netdev(ndev, &port);
744 if (!cdev)
745 cdev = cxgbi_device_find_by_mac(ndev, &port);
746 if (!cdev) {
747 pr_info("dst %pI6 %s, NOT cxgbi device.\n",
748 daddr6->sin6_addr.s6_addr, ndev->name);
749 err = -ENETUNREACH;
750 goto rel_rt;
751 }
752 log_debug(1 << CXGBI_DBG_SOCK,
753 "route to %pI6 :%u, ndev p#%d,%s, cdev 0x%p.\n",
754 daddr6->sin6_addr.s6_addr, ntohs(daddr6->sin6_port), port,
755 ndev->name, cdev);
756
757 csk = cxgbi_sock_create(cdev);
758 if (!csk) {
759 err = -ENOMEM;
760 goto rel_rt;
761 }
762 csk->cdev = cdev;
763 csk->port_id = port;
764 csk->mtu = mtu;
765 csk->dst = dst;
766
767 if (ipv6_addr_any(&rt->rt6i_prefsrc.addr)) {
768 struct inet6_dev *idev = ip6_dst_idev((struct dst_entry *)rt);
769
770 err = ipv6_dev_get_saddr(&init_net, idev ? idev->dev : NULL,
771 &daddr6->sin6_addr, 0, &pref_saddr);
772 if (err) {
773 pr_info("failed to get source address to reach %pI6\n",
774 &daddr6->sin6_addr);
775 goto rel_rt;
776 }
777 } else {
778 pref_saddr = rt->rt6i_prefsrc.addr;
779 }
780
781 csk->csk_family = AF_INET6;
782 csk->daddr6.sin6_addr = daddr6->sin6_addr;
783 csk->daddr6.sin6_port = daddr6->sin6_port;
784 csk->daddr6.sin6_family = daddr6->sin6_family;
785 csk->saddr6.sin6_family = daddr6->sin6_family;
786 csk->saddr6.sin6_addr = pref_saddr;
787
788 neigh_release(n);
789 return csk;
790
791 rel_rt:
792 if (n)
793 neigh_release(n);
794
795 ip6_rt_put(rt);
796 if (csk)
797 cxgbi_sock_closed(csk);
798 err_out:
799 return ERR_PTR(err);
800 }
801 #endif /* IS_ENABLED(CONFIG_IPV6) */
802
803 void cxgbi_sock_established(struct cxgbi_sock *csk, unsigned int snd_isn,
804 unsigned int opt)
805 {
806 csk->write_seq = csk->snd_nxt = csk->snd_una = snd_isn;
807 dst_confirm(csk->dst);
808 smp_mb();
809 cxgbi_sock_set_state(csk, CTP_ESTABLISHED);
810 }
811 EXPORT_SYMBOL_GPL(cxgbi_sock_established);
812
813 static void cxgbi_inform_iscsi_conn_closing(struct cxgbi_sock *csk)
814 {
815 log_debug(1 << CXGBI_DBG_SOCK,
816 "csk 0x%p, state %u, flags 0x%lx, conn 0x%p.\n",
817 csk, csk->state, csk->flags, csk->user_data);
818
819 if (csk->state != CTP_ESTABLISHED) {
820 read_lock_bh(&csk->callback_lock);
821 if (csk->user_data)
822 iscsi_conn_failure(csk->user_data,
823 ISCSI_ERR_TCP_CONN_CLOSE);
824 read_unlock_bh(&csk->callback_lock);
825 }
826 }
827
828 void cxgbi_sock_closed(struct cxgbi_sock *csk)
829 {
830 log_debug(1 << CXGBI_DBG_SOCK, "csk 0x%p,%u,0x%lx,%u.\n",
831 csk, (csk)->state, (csk)->flags, (csk)->tid);
832 cxgbi_sock_set_flag(csk, CTPF_ACTIVE_CLOSE_NEEDED);
833 if (csk->state == CTP_ACTIVE_OPEN || csk->state == CTP_CLOSED)
834 return;
835 if (csk->saddr.sin_port)
836 sock_put_port(csk);
837 if (csk->dst)
838 dst_release(csk->dst);
839 csk->cdev->csk_release_offload_resources(csk);
840 cxgbi_sock_set_state(csk, CTP_CLOSED);
841 cxgbi_inform_iscsi_conn_closing(csk);
842 cxgbi_sock_put(csk);
843 }
844 EXPORT_SYMBOL_GPL(cxgbi_sock_closed);
845
846 static void need_active_close(struct cxgbi_sock *csk)
847 {
848 int data_lost;
849 int close_req = 0;
850
851 log_debug(1 << CXGBI_DBG_SOCK, "csk 0x%p,%u,0x%lx,%u.\n",
852 csk, (csk)->state, (csk)->flags, (csk)->tid);
853 spin_lock_bh(&csk->lock);
854 dst_confirm(csk->dst);
855 data_lost = skb_queue_len(&csk->receive_queue);
856 __skb_queue_purge(&csk->receive_queue);
857
858 if (csk->state == CTP_ACTIVE_OPEN)
859 cxgbi_sock_set_flag(csk, CTPF_ACTIVE_CLOSE_NEEDED);
860 else if (csk->state == CTP_ESTABLISHED) {
861 close_req = 1;
862 cxgbi_sock_set_state(csk, CTP_ACTIVE_CLOSE);
863 } else if (csk->state == CTP_PASSIVE_CLOSE) {
864 close_req = 1;
865 cxgbi_sock_set_state(csk, CTP_CLOSE_WAIT_2);
866 }
867
868 if (close_req) {
869 if (data_lost)
870 csk->cdev->csk_send_abort_req(csk);
871 else
872 csk->cdev->csk_send_close_req(csk);
873 }
874
875 spin_unlock_bh(&csk->lock);
876 }
877
878 void cxgbi_sock_fail_act_open(struct cxgbi_sock *csk, int errno)
879 {
880 pr_info("csk 0x%p,%u,%lx, %pI4:%u-%pI4:%u, err %d.\n",
881 csk, csk->state, csk->flags,
882 &csk->saddr.sin_addr.s_addr, csk->saddr.sin_port,
883 &csk->daddr.sin_addr.s_addr, csk->daddr.sin_port,
884 errno);
885
886 cxgbi_sock_set_state(csk, CTP_CONNECTING);
887 csk->err = errno;
888 cxgbi_sock_closed(csk);
889 }
890 EXPORT_SYMBOL_GPL(cxgbi_sock_fail_act_open);
891
892 void cxgbi_sock_act_open_req_arp_failure(void *handle, struct sk_buff *skb)
893 {
894 struct cxgbi_sock *csk = (struct cxgbi_sock *)skb->sk;
895
896 log_debug(1 << CXGBI_DBG_SOCK, "csk 0x%p,%u,0x%lx,%u.\n",
897 csk, (csk)->state, (csk)->flags, (csk)->tid);
898 cxgbi_sock_get(csk);
899 spin_lock_bh(&csk->lock);
900 if (csk->state == CTP_ACTIVE_OPEN)
901 cxgbi_sock_fail_act_open(csk, -EHOSTUNREACH);
902 spin_unlock_bh(&csk->lock);
903 cxgbi_sock_put(csk);
904 __kfree_skb(skb);
905 }
906 EXPORT_SYMBOL_GPL(cxgbi_sock_act_open_req_arp_failure);
907
908 void cxgbi_sock_rcv_abort_rpl(struct cxgbi_sock *csk)
909 {
910 cxgbi_sock_get(csk);
911 spin_lock_bh(&csk->lock);
912
913 cxgbi_sock_set_flag(csk, CTPF_ABORT_RPL_RCVD);
914 if (cxgbi_sock_flag(csk, CTPF_ABORT_RPL_PENDING)) {
915 cxgbi_sock_clear_flag(csk, CTPF_ABORT_RPL_PENDING);
916 if (cxgbi_sock_flag(csk, CTPF_ABORT_REQ_RCVD))
917 pr_err("csk 0x%p,%u,0x%lx,%u,ABT_RPL_RSS.\n",
918 csk, csk->state, csk->flags, csk->tid);
919 cxgbi_sock_closed(csk);
920 }
921
922 spin_unlock_bh(&csk->lock);
923 cxgbi_sock_put(csk);
924 }
925 EXPORT_SYMBOL_GPL(cxgbi_sock_rcv_abort_rpl);
926
927 void cxgbi_sock_rcv_peer_close(struct cxgbi_sock *csk)
928 {
929 log_debug(1 << CXGBI_DBG_SOCK, "csk 0x%p,%u,0x%lx,%u.\n",
930 csk, (csk)->state, (csk)->flags, (csk)->tid);
931 cxgbi_sock_get(csk);
932 spin_lock_bh(&csk->lock);
933
934 if (cxgbi_sock_flag(csk, CTPF_ABORT_RPL_PENDING))
935 goto done;
936
937 switch (csk->state) {
938 case CTP_ESTABLISHED:
939 cxgbi_sock_set_state(csk, CTP_PASSIVE_CLOSE);
940 break;
941 case CTP_ACTIVE_CLOSE:
942 cxgbi_sock_set_state(csk, CTP_CLOSE_WAIT_2);
943 break;
944 case CTP_CLOSE_WAIT_1:
945 cxgbi_sock_closed(csk);
946 break;
947 case CTP_ABORTING:
948 break;
949 default:
950 pr_err("csk 0x%p,%u,0x%lx,%u, bad state.\n",
951 csk, csk->state, csk->flags, csk->tid);
952 }
953 cxgbi_inform_iscsi_conn_closing(csk);
954 done:
955 spin_unlock_bh(&csk->lock);
956 cxgbi_sock_put(csk);
957 }
958 EXPORT_SYMBOL_GPL(cxgbi_sock_rcv_peer_close);
959
960 void cxgbi_sock_rcv_close_conn_rpl(struct cxgbi_sock *csk, u32 snd_nxt)
961 {
962 log_debug(1 << CXGBI_DBG_SOCK, "csk 0x%p,%u,0x%lx,%u.\n",
963 csk, (csk)->state, (csk)->flags, (csk)->tid);
964 cxgbi_sock_get(csk);
965 spin_lock_bh(&csk->lock);
966
967 csk->snd_una = snd_nxt - 1;
968 if (cxgbi_sock_flag(csk, CTPF_ABORT_RPL_PENDING))
969 goto done;
970
971 switch (csk->state) {
972 case CTP_ACTIVE_CLOSE:
973 cxgbi_sock_set_state(csk, CTP_CLOSE_WAIT_1);
974 break;
975 case CTP_CLOSE_WAIT_1:
976 case CTP_CLOSE_WAIT_2:
977 cxgbi_sock_closed(csk);
978 break;
979 case CTP_ABORTING:
980 break;
981 default:
982 pr_err("csk 0x%p,%u,0x%lx,%u, bad state.\n",
983 csk, csk->state, csk->flags, csk->tid);
984 }
985 done:
986 spin_unlock_bh(&csk->lock);
987 cxgbi_sock_put(csk);
988 }
989 EXPORT_SYMBOL_GPL(cxgbi_sock_rcv_close_conn_rpl);
990
991 void cxgbi_sock_rcv_wr_ack(struct cxgbi_sock *csk, unsigned int credits,
992 unsigned int snd_una, int seq_chk)
993 {
994 log_debug(1 << CXGBI_DBG_TOE | 1 << CXGBI_DBG_SOCK,
995 "csk 0x%p,%u,0x%lx,%u, cr %u,%u+%u, snd_una %u,%d.\n",
996 csk, csk->state, csk->flags, csk->tid, credits,
997 csk->wr_cred, csk->wr_una_cred, snd_una, seq_chk);
998
999 spin_lock_bh(&csk->lock);
1000
1001 csk->wr_cred += credits;
1002 if (csk->wr_una_cred > csk->wr_max_cred - csk->wr_cred)
1003 csk->wr_una_cred = csk->wr_max_cred - csk->wr_cred;
1004
1005 while (credits) {
1006 struct sk_buff *p = cxgbi_sock_peek_wr(csk);
1007
1008 if (unlikely(!p)) {
1009 pr_err("csk 0x%p,%u,0x%lx,%u, cr %u,%u+%u, empty.\n",
1010 csk, csk->state, csk->flags, csk->tid, credits,
1011 csk->wr_cred, csk->wr_una_cred);
1012 break;
1013 }
1014
1015 if (unlikely(credits < p->csum)) {
1016 pr_warn("csk 0x%p,%u,0x%lx,%u, cr %u,%u+%u, < %u.\n",
1017 csk, csk->state, csk->flags, csk->tid,
1018 credits, csk->wr_cred, csk->wr_una_cred,
1019 p->csum);
1020 p->csum -= credits;
1021 break;
1022 } else {
1023 cxgbi_sock_dequeue_wr(csk);
1024 credits -= p->csum;
1025 kfree_skb(p);
1026 }
1027 }
1028
1029 cxgbi_sock_check_wr_invariants(csk);
1030
1031 if (seq_chk) {
1032 if (unlikely(before(snd_una, csk->snd_una))) {
1033 pr_warn("csk 0x%p,%u,0x%lx,%u, snd_una %u/%u.",
1034 csk, csk->state, csk->flags, csk->tid, snd_una,
1035 csk->snd_una);
1036 goto done;
1037 }
1038
1039 if (csk->snd_una != snd_una) {
1040 csk->snd_una = snd_una;
1041 dst_confirm(csk->dst);
1042 }
1043 }
1044
1045 if (skb_queue_len(&csk->write_queue)) {
1046 if (csk->cdev->csk_push_tx_frames(csk, 0))
1047 cxgbi_conn_tx_open(csk);
1048 } else
1049 cxgbi_conn_tx_open(csk);
1050 done:
1051 spin_unlock_bh(&csk->lock);
1052 }
1053 EXPORT_SYMBOL_GPL(cxgbi_sock_rcv_wr_ack);
1054
1055 static unsigned int cxgbi_sock_find_best_mtu(struct cxgbi_sock *csk,
1056 unsigned short mtu)
1057 {
1058 int i = 0;
1059
1060 while (i < csk->cdev->nmtus - 1 && csk->cdev->mtus[i + 1] <= mtu)
1061 ++i;
1062
1063 return i;
1064 }
1065
1066 unsigned int cxgbi_sock_select_mss(struct cxgbi_sock *csk, unsigned int pmtu)
1067 {
1068 unsigned int idx;
1069 struct dst_entry *dst = csk->dst;
1070
1071 csk->advmss = dst_metric_advmss(dst);
1072
1073 if (csk->advmss > pmtu - 40)
1074 csk->advmss = pmtu - 40;
1075 if (csk->advmss < csk->cdev->mtus[0] - 40)
1076 csk->advmss = csk->cdev->mtus[0] - 40;
1077 idx = cxgbi_sock_find_best_mtu(csk, csk->advmss + 40);
1078
1079 return idx;
1080 }
1081 EXPORT_SYMBOL_GPL(cxgbi_sock_select_mss);
1082
1083 void cxgbi_sock_skb_entail(struct cxgbi_sock *csk, struct sk_buff *skb)
1084 {
1085 cxgbi_skcb_tcp_seq(skb) = csk->write_seq;
1086 __skb_queue_tail(&csk->write_queue, skb);
1087 }
1088 EXPORT_SYMBOL_GPL(cxgbi_sock_skb_entail);
1089
1090 void cxgbi_sock_purge_wr_queue(struct cxgbi_sock *csk)
1091 {
1092 struct sk_buff *skb;
1093
1094 while ((skb = cxgbi_sock_dequeue_wr(csk)) != NULL)
1095 kfree_skb(skb);
1096 }
1097 EXPORT_SYMBOL_GPL(cxgbi_sock_purge_wr_queue);
1098
1099 void cxgbi_sock_check_wr_invariants(const struct cxgbi_sock *csk)
1100 {
1101 int pending = cxgbi_sock_count_pending_wrs(csk);
1102
1103 if (unlikely(csk->wr_cred + pending != csk->wr_max_cred))
1104 pr_err("csk 0x%p, tid %u, credit %u + %u != %u.\n",
1105 csk, csk->tid, csk->wr_cred, pending, csk->wr_max_cred);
1106 }
1107 EXPORT_SYMBOL_GPL(cxgbi_sock_check_wr_invariants);
1108
1109 static int cxgbi_sock_send_pdus(struct cxgbi_sock *csk, struct sk_buff *skb)
1110 {
1111 struct cxgbi_device *cdev = csk->cdev;
1112 struct sk_buff *next;
1113 int err, copied = 0;
1114
1115 spin_lock_bh(&csk->lock);
1116
1117 if (csk->state != CTP_ESTABLISHED) {
1118 log_debug(1 << CXGBI_DBG_PDU_TX,
1119 "csk 0x%p,%u,0x%lx,%u, EAGAIN.\n",
1120 csk, csk->state, csk->flags, csk->tid);
1121 err = -EAGAIN;
1122 goto out_err;
1123 }
1124
1125 if (csk->err) {
1126 log_debug(1 << CXGBI_DBG_PDU_TX,
1127 "csk 0x%p,%u,0x%lx,%u, EPIPE %d.\n",
1128 csk, csk->state, csk->flags, csk->tid, csk->err);
1129 err = -EPIPE;
1130 goto out_err;
1131 }
1132
1133 if (csk->write_seq - csk->snd_una >= csk->snd_win) {
1134 log_debug(1 << CXGBI_DBG_PDU_TX,
1135 "csk 0x%p,%u,0x%lx,%u, FULL %u-%u >= %u.\n",
1136 csk, csk->state, csk->flags, csk->tid, csk->write_seq,
1137 csk->snd_una, csk->snd_win);
1138 err = -ENOBUFS;
1139 goto out_err;
1140 }
1141
1142 while (skb) {
1143 int frags = skb_shinfo(skb)->nr_frags +
1144 (skb->len != skb->data_len);
1145
1146 if (unlikely(skb_headroom(skb) < cdev->skb_tx_rsvd)) {
1147 pr_err("csk 0x%p, skb head %u < %u.\n",
1148 csk, skb_headroom(skb), cdev->skb_tx_rsvd);
1149 err = -EINVAL;
1150 goto out_err;
1151 }
1152
1153 if (frags >= SKB_WR_LIST_SIZE) {
1154 pr_err("csk 0x%p, frags %d, %u,%u >%u.\n",
1155 csk, skb_shinfo(skb)->nr_frags, skb->len,
1156 skb->data_len, (uint)(SKB_WR_LIST_SIZE));
1157 err = -EINVAL;
1158 goto out_err;
1159 }
1160
1161 next = skb->next;
1162 skb->next = NULL;
1163 cxgbi_skcb_set_flag(skb, SKCBF_TX_NEED_HDR);
1164 cxgbi_sock_skb_entail(csk, skb);
1165 copied += skb->len;
1166 csk->write_seq += skb->len +
1167 cxgbi_ulp_extra_len(cxgbi_skcb_ulp_mode(skb));
1168 skb = next;
1169 }
1170 done:
1171 if (likely(skb_queue_len(&csk->write_queue)))
1172 cdev->csk_push_tx_frames(csk, 1);
1173 spin_unlock_bh(&csk->lock);
1174 return copied;
1175
1176 out_err:
1177 if (copied == 0 && err == -EPIPE)
1178 copied = csk->err ? csk->err : -EPIPE;
1179 else
1180 copied = err;
1181 goto done;
1182 }
1183
1184 /*
1185 * Direct Data Placement -
1186 * Directly place the iSCSI Data-In or Data-Out PDU's payload into pre-posted
1187 * final destination host-memory buffers based on the Initiator Task Tag (ITT)
1188 * in Data-In or Target Task Tag (TTT) in Data-Out PDUs.
1189 * The host memory address is programmed into h/w in the format of pagepod
1190 * entries.
1191 * The location of the pagepod entry is encoded into ddp tag which is used as
1192 * the base for ITT/TTT.
1193 */
1194
1195 static unsigned char ddp_page_order[DDP_PGIDX_MAX] = {0, 1, 2, 4};
1196 static unsigned char ddp_page_shift[DDP_PGIDX_MAX] = {12, 13, 14, 16};
1197 static unsigned char page_idx = DDP_PGIDX_MAX;
1198
1199 static unsigned char sw_tag_idx_bits;
1200 static unsigned char sw_tag_age_bits;
1201
1202 /*
1203 * Direct-Data Placement page size adjustment
1204 */
1205 static int ddp_adjust_page_table(void)
1206 {
1207 int i;
1208 unsigned int base_order, order;
1209
1210 if (PAGE_SIZE < (1UL << ddp_page_shift[0])) {
1211 pr_info("PAGE_SIZE 0x%lx too small, min 0x%lx\n",
1212 PAGE_SIZE, 1UL << ddp_page_shift[0]);
1213 return -EINVAL;
1214 }
1215
1216 base_order = get_order(1UL << ddp_page_shift[0]);
1217 order = get_order(1UL << PAGE_SHIFT);
1218
1219 for (i = 0; i < DDP_PGIDX_MAX; i++) {
1220 /* first is the kernel page size, then just doubling */
1221 ddp_page_order[i] = order - base_order + i;
1222 ddp_page_shift[i] = PAGE_SHIFT + i;
1223 }
1224 return 0;
1225 }
1226
1227 static int ddp_find_page_index(unsigned long pgsz)
1228 {
1229 int i;
1230
1231 for (i = 0; i < DDP_PGIDX_MAX; i++) {
1232 if (pgsz == (1UL << ddp_page_shift[i]))
1233 return i;
1234 }
1235 pr_info("ddp page size %lu not supported.\n", pgsz);
1236 return DDP_PGIDX_MAX;
1237 }
1238
1239 static void ddp_setup_host_page_size(void)
1240 {
1241 if (page_idx == DDP_PGIDX_MAX) {
1242 page_idx = ddp_find_page_index(PAGE_SIZE);
1243
1244 if (page_idx == DDP_PGIDX_MAX) {
1245 pr_info("system PAGE %lu, update hw.\n", PAGE_SIZE);
1246 if (ddp_adjust_page_table() < 0) {
1247 pr_info("PAGE %lu, disable ddp.\n", PAGE_SIZE);
1248 return;
1249 }
1250 page_idx = ddp_find_page_index(PAGE_SIZE);
1251 }
1252 pr_info("system PAGE %lu, ddp idx %u.\n", PAGE_SIZE, page_idx);
1253 }
1254 }
1255
1256 void cxgbi_ddp_page_size_factor(int *pgsz_factor)
1257 {
1258 int i;
1259
1260 for (i = 0; i < DDP_PGIDX_MAX; i++)
1261 pgsz_factor[i] = ddp_page_order[i];
1262 }
1263 EXPORT_SYMBOL_GPL(cxgbi_ddp_page_size_factor);
1264
1265 /*
1266 * DDP setup & teardown
1267 */
1268
1269 void cxgbi_ddp_ppod_set(struct cxgbi_pagepod *ppod,
1270 struct cxgbi_pagepod_hdr *hdr,
1271 struct cxgbi_gather_list *gl, unsigned int gidx)
1272 {
1273 int i;
1274
1275 memcpy(ppod, hdr, sizeof(*hdr));
1276 for (i = 0; i < (PPOD_PAGES_MAX + 1); i++, gidx++) {
1277 ppod->addr[i] = gidx < gl->nelem ?
1278 cpu_to_be64(gl->phys_addr[gidx]) : 0ULL;
1279 }
1280 }
1281 EXPORT_SYMBOL_GPL(cxgbi_ddp_ppod_set);
1282
1283 void cxgbi_ddp_ppod_clear(struct cxgbi_pagepod *ppod)
1284 {
1285 memset(ppod, 0, sizeof(*ppod));
1286 }
1287 EXPORT_SYMBOL_GPL(cxgbi_ddp_ppod_clear);
1288
1289 static inline int ddp_find_unused_entries(struct cxgbi_ddp_info *ddp,
1290 unsigned int start, unsigned int max,
1291 unsigned int count,
1292 struct cxgbi_gather_list *gl)
1293 {
1294 unsigned int i, j, k;
1295
1296 /* not enough entries */
1297 if ((max - start) < count) {
1298 log_debug(1 << CXGBI_DBG_DDP,
1299 "NOT enough entries %u+%u < %u.\n", start, count, max);
1300 return -EBUSY;
1301 }
1302
1303 max -= count;
1304 spin_lock(&ddp->map_lock);
1305 for (i = start; i < max;) {
1306 for (j = 0, k = i; j < count; j++, k++) {
1307 if (ddp->gl_map[k])
1308 break;
1309 }
1310 if (j == count) {
1311 for (j = 0, k = i; j < count; j++, k++)
1312 ddp->gl_map[k] = gl;
1313 spin_unlock(&ddp->map_lock);
1314 return i;
1315 }
1316 i += j + 1;
1317 }
1318 spin_unlock(&ddp->map_lock);
1319 log_debug(1 << CXGBI_DBG_DDP,
1320 "NO suitable entries %u available.\n", count);
1321 return -EBUSY;
1322 }
1323
1324 static inline void ddp_unmark_entries(struct cxgbi_ddp_info *ddp,
1325 int start, int count)
1326 {
1327 spin_lock(&ddp->map_lock);
1328 memset(&ddp->gl_map[start], 0,
1329 count * sizeof(struct cxgbi_gather_list *));
1330 spin_unlock(&ddp->map_lock);
1331 }
1332
1333 static inline void ddp_gl_unmap(struct pci_dev *pdev,
1334 struct cxgbi_gather_list *gl)
1335 {
1336 int i;
1337
1338 for (i = 0; i < gl->nelem; i++)
1339 dma_unmap_page(&pdev->dev, gl->phys_addr[i], PAGE_SIZE,
1340 PCI_DMA_FROMDEVICE);
1341 }
1342
1343 static inline int ddp_gl_map(struct pci_dev *pdev,
1344 struct cxgbi_gather_list *gl)
1345 {
1346 int i;
1347
1348 for (i = 0; i < gl->nelem; i++) {
1349 gl->phys_addr[i] = dma_map_page(&pdev->dev, gl->pages[i], 0,
1350 PAGE_SIZE,
1351 PCI_DMA_FROMDEVICE);
1352 if (unlikely(dma_mapping_error(&pdev->dev, gl->phys_addr[i]))) {
1353 log_debug(1 << CXGBI_DBG_DDP,
1354 "page %d 0x%p, 0x%p dma mapping err.\n",
1355 i, gl->pages[i], pdev);
1356 goto unmap;
1357 }
1358 }
1359 return i;
1360 unmap:
1361 if (i) {
1362 unsigned int nelem = gl->nelem;
1363
1364 gl->nelem = i;
1365 ddp_gl_unmap(pdev, gl);
1366 gl->nelem = nelem;
1367 }
1368 return -EINVAL;
1369 }
1370
1371 static void ddp_release_gl(struct cxgbi_gather_list *gl,
1372 struct pci_dev *pdev)
1373 {
1374 ddp_gl_unmap(pdev, gl);
1375 kfree(gl);
1376 }
1377
1378 static struct cxgbi_gather_list *ddp_make_gl(unsigned int xferlen,
1379 struct scatterlist *sgl,
1380 unsigned int sgcnt,
1381 struct pci_dev *pdev,
1382 gfp_t gfp)
1383 {
1384 struct cxgbi_gather_list *gl;
1385 struct scatterlist *sg = sgl;
1386 struct page *sgpage = sg_page(sg);
1387 unsigned int sglen = sg->length;
1388 unsigned int sgoffset = sg->offset;
1389 unsigned int npages = (xferlen + sgoffset + PAGE_SIZE - 1) >>
1390 PAGE_SHIFT;
1391 int i = 1, j = 0;
1392
1393 if (xferlen < DDP_THRESHOLD) {
1394 log_debug(1 << CXGBI_DBG_DDP,
1395 "xfer %u < threshold %u, no ddp.\n",
1396 xferlen, DDP_THRESHOLD);
1397 return NULL;
1398 }
1399
1400 gl = kzalloc(sizeof(struct cxgbi_gather_list) +
1401 npages * (sizeof(dma_addr_t) +
1402 sizeof(struct page *)), gfp);
1403 if (!gl) {
1404 log_debug(1 << CXGBI_DBG_DDP,
1405 "xfer %u, %u pages, OOM.\n", xferlen, npages);
1406 return NULL;
1407 }
1408
1409 log_debug(1 << CXGBI_DBG_DDP,
1410 "xfer %u, sgl %u, gl max %u.\n", xferlen, sgcnt, npages);
1411
1412 gl->pages = (struct page **)&gl->phys_addr[npages];
1413 gl->nelem = npages;
1414 gl->length = xferlen;
1415 gl->offset = sgoffset;
1416 gl->pages[0] = sgpage;
1417
1418 for (i = 1, sg = sg_next(sgl), j = 0; i < sgcnt;
1419 i++, sg = sg_next(sg)) {
1420 struct page *page = sg_page(sg);
1421
1422 if (sgpage == page && sg->offset == sgoffset + sglen)
1423 sglen += sg->length;
1424 else {
1425 /* make sure the sgl is fit for ddp:
1426 * each has the same page size, and
1427 * all of the middle pages are used completely
1428 */
1429 if ((j && sgoffset) || ((i != sgcnt - 1) &&
1430 ((sglen + sgoffset) & ~PAGE_MASK))) {
1431 log_debug(1 << CXGBI_DBG_DDP,
1432 "page %d/%u, %u + %u.\n",
1433 i, sgcnt, sgoffset, sglen);
1434 goto error_out;
1435 }
1436
1437 j++;
1438 if (j == gl->nelem || sg->offset) {
1439 log_debug(1 << CXGBI_DBG_DDP,
1440 "page %d/%u, offset %u.\n",
1441 j, gl->nelem, sg->offset);
1442 goto error_out;
1443 }
1444 gl->pages[j] = page;
1445 sglen = sg->length;
1446 sgoffset = sg->offset;
1447 sgpage = page;
1448 }
1449 }
1450 gl->nelem = ++j;
1451
1452 if (ddp_gl_map(pdev, gl) < 0)
1453 goto error_out;
1454
1455 return gl;
1456
1457 error_out:
1458 kfree(gl);
1459 return NULL;
1460 }
1461
1462 static void ddp_tag_release(struct cxgbi_hba *chba, u32 tag)
1463 {
1464 struct cxgbi_device *cdev = chba->cdev;
1465 struct cxgbi_ddp_info *ddp = cdev->ddp;
1466 u32 idx;
1467
1468 idx = (tag >> PPOD_IDX_SHIFT) & ddp->idx_mask;
1469 if (idx < ddp->nppods) {
1470 struct cxgbi_gather_list *gl = ddp->gl_map[idx];
1471 unsigned int npods;
1472
1473 if (!gl || !gl->nelem) {
1474 pr_warn("tag 0x%x, idx %u, gl 0x%p, %u.\n",
1475 tag, idx, gl, gl ? gl->nelem : 0);
1476 return;
1477 }
1478 npods = (gl->nelem + PPOD_PAGES_MAX - 1) >> PPOD_PAGES_SHIFT;
1479 log_debug(1 << CXGBI_DBG_DDP,
1480 "tag 0x%x, release idx %u, npods %u.\n",
1481 tag, idx, npods);
1482 cdev->csk_ddp_clear(chba, tag, idx, npods);
1483 ddp_unmark_entries(ddp, idx, npods);
1484 ddp_release_gl(gl, ddp->pdev);
1485 } else
1486 pr_warn("tag 0x%x, idx %u > max %u.\n", tag, idx, ddp->nppods);
1487 }
1488
1489 static int ddp_tag_reserve(struct cxgbi_sock *csk, unsigned int tid,
1490 u32 sw_tag, u32 *tagp, struct cxgbi_gather_list *gl,
1491 gfp_t gfp)
1492 {
1493 struct cxgbi_device *cdev = csk->cdev;
1494 struct cxgbi_ddp_info *ddp = cdev->ddp;
1495 struct cxgbi_tag_format *tformat = &cdev->tag_format;
1496 struct cxgbi_pagepod_hdr hdr;
1497 unsigned int npods;
1498 int idx = -1;
1499 int err = -ENOMEM;
1500 u32 tag;
1501
1502 npods = (gl->nelem + PPOD_PAGES_MAX - 1) >> PPOD_PAGES_SHIFT;
1503 if (ddp->idx_last == ddp->nppods)
1504 idx = ddp_find_unused_entries(ddp, 0, ddp->nppods,
1505 npods, gl);
1506 else {
1507 idx = ddp_find_unused_entries(ddp, ddp->idx_last + 1,
1508 ddp->nppods, npods,
1509 gl);
1510 if (idx < 0 && ddp->idx_last >= npods) {
1511 idx = ddp_find_unused_entries(ddp, 0,
1512 min(ddp->idx_last + npods, ddp->nppods),
1513 npods, gl);
1514 }
1515 }
1516 if (idx < 0) {
1517 log_debug(1 << CXGBI_DBG_DDP,
1518 "xferlen %u, gl %u, npods %u NO DDP.\n",
1519 gl->length, gl->nelem, npods);
1520 return idx;
1521 }
1522
1523 tag = cxgbi_ddp_tag_base(tformat, sw_tag);
1524 tag |= idx << PPOD_IDX_SHIFT;
1525
1526 hdr.rsvd = 0;
1527 hdr.vld_tid = htonl(PPOD_VALID_FLAG | PPOD_TID(tid));
1528 hdr.pgsz_tag_clr = htonl(tag & ddp->rsvd_tag_mask);
1529 hdr.max_offset = htonl(gl->length);
1530 hdr.page_offset = htonl(gl->offset);
1531
1532 err = cdev->csk_ddp_set(csk, &hdr, idx, npods, gl);
1533 if (err < 0)
1534 goto unmark_entries;
1535
1536 ddp->idx_last = idx;
1537 log_debug(1 << CXGBI_DBG_DDP,
1538 "xfer %u, gl %u,%u, tid 0x%x, tag 0x%x->0x%x(%u,%u).\n",
1539 gl->length, gl->nelem, gl->offset, tid, sw_tag, tag, idx,
1540 npods);
1541 *tagp = tag;
1542 return 0;
1543
1544 unmark_entries:
1545 ddp_unmark_entries(ddp, idx, npods);
1546 return err;
1547 }
1548
1549 int cxgbi_ddp_reserve(struct cxgbi_sock *csk, unsigned int *tagp,
1550 unsigned int sw_tag, unsigned int xferlen,
1551 struct scatterlist *sgl, unsigned int sgcnt, gfp_t gfp)
1552 {
1553 struct cxgbi_device *cdev = csk->cdev;
1554 struct cxgbi_tag_format *tformat = &cdev->tag_format;
1555 struct cxgbi_gather_list *gl;
1556 int err;
1557
1558 if (page_idx >= DDP_PGIDX_MAX || !cdev->ddp ||
1559 xferlen < DDP_THRESHOLD) {
1560 log_debug(1 << CXGBI_DBG_DDP,
1561 "pgidx %u, xfer %u, NO ddp.\n", page_idx, xferlen);
1562 return -EINVAL;
1563 }
1564
1565 if (!cxgbi_sw_tag_usable(tformat, sw_tag)) {
1566 log_debug(1 << CXGBI_DBG_DDP,
1567 "sw_tag 0x%x NOT usable.\n", sw_tag);
1568 return -EINVAL;
1569 }
1570
1571 gl = ddp_make_gl(xferlen, sgl, sgcnt, cdev->pdev, gfp);
1572 if (!gl)
1573 return -ENOMEM;
1574
1575 err = ddp_tag_reserve(csk, csk->tid, sw_tag, tagp, gl, gfp);
1576 if (err < 0)
1577 ddp_release_gl(gl, cdev->pdev);
1578
1579 return err;
1580 }
1581
1582 static void ddp_destroy(struct kref *kref)
1583 {
1584 struct cxgbi_ddp_info *ddp = container_of(kref,
1585 struct cxgbi_ddp_info,
1586 refcnt);
1587 struct cxgbi_device *cdev = ddp->cdev;
1588 int i = 0;
1589
1590 pr_info("kref 0, destroy ddp 0x%p, cdev 0x%p.\n", ddp, cdev);
1591
1592 while (i < ddp->nppods) {
1593 struct cxgbi_gather_list *gl = ddp->gl_map[i];
1594
1595 if (gl) {
1596 int npods = (gl->nelem + PPOD_PAGES_MAX - 1)
1597 >> PPOD_PAGES_SHIFT;
1598 pr_info("cdev 0x%p, ddp %d + %d.\n", cdev, i, npods);
1599 kfree(gl);
1600 i += npods;
1601 } else
1602 i++;
1603 }
1604 cxgbi_free_big_mem(ddp);
1605 }
1606
1607 int cxgbi_ddp_cleanup(struct cxgbi_device *cdev)
1608 {
1609 struct cxgbi_ddp_info *ddp = cdev->ddp;
1610
1611 log_debug(1 << CXGBI_DBG_DDP,
1612 "cdev 0x%p, release ddp 0x%p.\n", cdev, ddp);
1613 cdev->ddp = NULL;
1614 if (ddp)
1615 return kref_put(&ddp->refcnt, ddp_destroy);
1616 return 0;
1617 }
1618 EXPORT_SYMBOL_GPL(cxgbi_ddp_cleanup);
1619
1620 int cxgbi_ddp_init(struct cxgbi_device *cdev,
1621 unsigned int llimit, unsigned int ulimit,
1622 unsigned int max_txsz, unsigned int max_rxsz)
1623 {
1624 struct cxgbi_ddp_info *ddp;
1625 unsigned int ppmax, bits;
1626
1627 ppmax = (ulimit - llimit + 1) >> PPOD_SIZE_SHIFT;
1628 bits = __ilog2_u32(ppmax) + 1;
1629 if (bits > PPOD_IDX_MAX_SIZE)
1630 bits = PPOD_IDX_MAX_SIZE;
1631 ppmax = (1 << (bits - 1)) - 1;
1632
1633 ddp = cxgbi_alloc_big_mem(sizeof(struct cxgbi_ddp_info) +
1634 ppmax * (sizeof(struct cxgbi_gather_list *) +
1635 sizeof(struct sk_buff *)),
1636 GFP_KERNEL);
1637 if (!ddp) {
1638 pr_warn("cdev 0x%p, ddp ppmax %u OOM.\n", cdev, ppmax);
1639 return -ENOMEM;
1640 }
1641 ddp->gl_map = (struct cxgbi_gather_list **)(ddp + 1);
1642 cdev->ddp = ddp;
1643
1644 spin_lock_init(&ddp->map_lock);
1645 kref_init(&ddp->refcnt);
1646
1647 ddp->cdev = cdev;
1648 ddp->pdev = cdev->pdev;
1649 ddp->llimit = llimit;
1650 ddp->ulimit = ulimit;
1651 ddp->max_txsz = min_t(unsigned int, max_txsz, ULP2_MAX_PKT_SIZE);
1652 ddp->max_rxsz = min_t(unsigned int, max_rxsz, ULP2_MAX_PKT_SIZE);
1653 ddp->nppods = ppmax;
1654 ddp->idx_last = ppmax;
1655 ddp->idx_bits = bits;
1656 ddp->idx_mask = (1 << bits) - 1;
1657 ddp->rsvd_tag_mask = (1 << (bits + PPOD_IDX_SHIFT)) - 1;
1658
1659 cdev->tag_format.sw_bits = sw_tag_idx_bits + sw_tag_age_bits;
1660 cdev->tag_format.rsvd_bits = ddp->idx_bits;
1661 cdev->tag_format.rsvd_shift = PPOD_IDX_SHIFT;
1662 cdev->tag_format.rsvd_mask = (1 << cdev->tag_format.rsvd_bits) - 1;
1663
1664 pr_info("%s tag format, sw %u, rsvd %u,%u, mask 0x%x.\n",
1665 cdev->ports[0]->name, cdev->tag_format.sw_bits,
1666 cdev->tag_format.rsvd_bits, cdev->tag_format.rsvd_shift,
1667 cdev->tag_format.rsvd_mask);
1668
1669 cdev->tx_max_size = min_t(unsigned int, ULP2_MAX_PDU_PAYLOAD,
1670 ddp->max_txsz - ISCSI_PDU_NONPAYLOAD_LEN);
1671 cdev->rx_max_size = min_t(unsigned int, ULP2_MAX_PDU_PAYLOAD,
1672 ddp->max_rxsz - ISCSI_PDU_NONPAYLOAD_LEN);
1673
1674 log_debug(1 << CXGBI_DBG_DDP,
1675 "%s max payload size: %u/%u, %u/%u.\n",
1676 cdev->ports[0]->name, cdev->tx_max_size, ddp->max_txsz,
1677 cdev->rx_max_size, ddp->max_rxsz);
1678 return 0;
1679 }
1680 EXPORT_SYMBOL_GPL(cxgbi_ddp_init);
1681
1682 /*
1683 * APIs interacting with open-iscsi libraries
1684 */
1685
1686 static unsigned char padding[4];
1687
1688 static void task_release_itt(struct iscsi_task *task, itt_t hdr_itt)
1689 {
1690 struct scsi_cmnd *sc = task->sc;
1691 struct iscsi_tcp_conn *tcp_conn = task->conn->dd_data;
1692 struct cxgbi_conn *cconn = tcp_conn->dd_data;
1693 struct cxgbi_hba *chba = cconn->chba;
1694 struct cxgbi_tag_format *tformat = &chba->cdev->tag_format;
1695 u32 tag = ntohl((__force u32)hdr_itt);
1696
1697 log_debug(1 << CXGBI_DBG_DDP,
1698 "cdev 0x%p, release tag 0x%x.\n", chba->cdev, tag);
1699 if (sc &&
1700 (scsi_bidi_cmnd(sc) || sc->sc_data_direction == DMA_FROM_DEVICE) &&
1701 cxgbi_is_ddp_tag(tformat, tag))
1702 ddp_tag_release(chba, tag);
1703 }
1704
1705 static int task_reserve_itt(struct iscsi_task *task, itt_t *hdr_itt)
1706 {
1707 struct scsi_cmnd *sc = task->sc;
1708 struct iscsi_conn *conn = task->conn;
1709 struct iscsi_session *sess = conn->session;
1710 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1711 struct cxgbi_conn *cconn = tcp_conn->dd_data;
1712 struct cxgbi_hba *chba = cconn->chba;
1713 struct cxgbi_tag_format *tformat = &chba->cdev->tag_format;
1714 u32 sw_tag = (sess->age << cconn->task_idx_bits) | task->itt;
1715 u32 tag = 0;
1716 int err = -EINVAL;
1717
1718 if (sc &&
1719 (scsi_bidi_cmnd(sc) || sc->sc_data_direction == DMA_FROM_DEVICE)) {
1720 err = cxgbi_ddp_reserve(cconn->cep->csk, &tag, sw_tag,
1721 scsi_in(sc)->length,
1722 scsi_in(sc)->table.sgl,
1723 scsi_in(sc)->table.nents,
1724 GFP_ATOMIC);
1725 if (err < 0)
1726 log_debug(1 << CXGBI_DBG_DDP,
1727 "csk 0x%p, R task 0x%p, %u,%u, no ddp.\n",
1728 cconn->cep->csk, task, scsi_in(sc)->length,
1729 scsi_in(sc)->table.nents);
1730 }
1731
1732 if (err < 0)
1733 tag = cxgbi_set_non_ddp_tag(tformat, sw_tag);
1734 /* the itt need to sent in big-endian order */
1735 *hdr_itt = (__force itt_t)htonl(tag);
1736
1737 log_debug(1 << CXGBI_DBG_DDP,
1738 "cdev 0x%p, task 0x%p, 0x%x(0x%x,0x%x)->0x%x/0x%x.\n",
1739 chba->cdev, task, sw_tag, task->itt, sess->age, tag, *hdr_itt);
1740 return 0;
1741 }
1742
1743 void cxgbi_parse_pdu_itt(struct iscsi_conn *conn, itt_t itt, int *idx, int *age)
1744 {
1745 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1746 struct cxgbi_conn *cconn = tcp_conn->dd_data;
1747 struct cxgbi_device *cdev = cconn->chba->cdev;
1748 u32 tag = ntohl((__force u32) itt);
1749 u32 sw_bits;
1750
1751 sw_bits = cxgbi_tag_nonrsvd_bits(&cdev->tag_format, tag);
1752 if (idx)
1753 *idx = sw_bits & ((1 << cconn->task_idx_bits) - 1);
1754 if (age)
1755 *age = (sw_bits >> cconn->task_idx_bits) & ISCSI_AGE_MASK;
1756
1757 log_debug(1 << CXGBI_DBG_DDP,
1758 "cdev 0x%p, tag 0x%x/0x%x, -> 0x%x(0x%x,0x%x).\n",
1759 cdev, tag, itt, sw_bits, idx ? *idx : 0xFFFFF,
1760 age ? *age : 0xFF);
1761 }
1762 EXPORT_SYMBOL_GPL(cxgbi_parse_pdu_itt);
1763
1764 void cxgbi_conn_tx_open(struct cxgbi_sock *csk)
1765 {
1766 struct iscsi_conn *conn = csk->user_data;
1767
1768 if (conn) {
1769 log_debug(1 << CXGBI_DBG_SOCK,
1770 "csk 0x%p, cid %d.\n", csk, conn->id);
1771 iscsi_conn_queue_work(conn);
1772 }
1773 }
1774 EXPORT_SYMBOL_GPL(cxgbi_conn_tx_open);
1775
1776 /*
1777 * pdu receive, interact with libiscsi_tcp
1778 */
1779 static inline int read_pdu_skb(struct iscsi_conn *conn,
1780 struct sk_buff *skb,
1781 unsigned int offset,
1782 int offloaded)
1783 {
1784 int status = 0;
1785 int bytes_read;
1786
1787 bytes_read = iscsi_tcp_recv_skb(conn, skb, offset, offloaded, &status);
1788 switch (status) {
1789 case ISCSI_TCP_CONN_ERR:
1790 pr_info("skb 0x%p, off %u, %d, TCP_ERR.\n",
1791 skb, offset, offloaded);
1792 return -EIO;
1793 case ISCSI_TCP_SUSPENDED:
1794 log_debug(1 << CXGBI_DBG_PDU_RX,
1795 "skb 0x%p, off %u, %d, TCP_SUSPEND, rc %d.\n",
1796 skb, offset, offloaded, bytes_read);
1797 /* no transfer - just have caller flush queue */
1798 return bytes_read;
1799 case ISCSI_TCP_SKB_DONE:
1800 pr_info("skb 0x%p, off %u, %d, TCP_SKB_DONE.\n",
1801 skb, offset, offloaded);
1802 /*
1803 * pdus should always fit in the skb and we should get
1804 * segment done notifcation.
1805 */
1806 iscsi_conn_printk(KERN_ERR, conn, "Invalid pdu or skb.");
1807 return -EFAULT;
1808 case ISCSI_TCP_SEGMENT_DONE:
1809 log_debug(1 << CXGBI_DBG_PDU_RX,
1810 "skb 0x%p, off %u, %d, TCP_SEG_DONE, rc %d.\n",
1811 skb, offset, offloaded, bytes_read);
1812 return bytes_read;
1813 default:
1814 pr_info("skb 0x%p, off %u, %d, invalid status %d.\n",
1815 skb, offset, offloaded, status);
1816 return -EINVAL;
1817 }
1818 }
1819
1820 static int skb_read_pdu_bhs(struct iscsi_conn *conn, struct sk_buff *skb)
1821 {
1822 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1823
1824 log_debug(1 << CXGBI_DBG_PDU_RX,
1825 "conn 0x%p, skb 0x%p, len %u, flag 0x%lx.\n",
1826 conn, skb, skb->len, cxgbi_skcb_flags(skb));
1827
1828 if (!iscsi_tcp_recv_segment_is_hdr(tcp_conn)) {
1829 pr_info("conn 0x%p, skb 0x%p, not hdr.\n", conn, skb);
1830 iscsi_conn_failure(conn, ISCSI_ERR_PROTO);
1831 return -EIO;
1832 }
1833
1834 if (conn->hdrdgst_en &&
1835 cxgbi_skcb_test_flag(skb, SKCBF_RX_HCRC_ERR)) {
1836 pr_info("conn 0x%p, skb 0x%p, hcrc.\n", conn, skb);
1837 iscsi_conn_failure(conn, ISCSI_ERR_HDR_DGST);
1838 return -EIO;
1839 }
1840
1841 return read_pdu_skb(conn, skb, 0, 0);
1842 }
1843
1844 static int skb_read_pdu_data(struct iscsi_conn *conn, struct sk_buff *lskb,
1845 struct sk_buff *skb, unsigned int offset)
1846 {
1847 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1848 bool offloaded = 0;
1849 int opcode = tcp_conn->in.hdr->opcode & ISCSI_OPCODE_MASK;
1850
1851 log_debug(1 << CXGBI_DBG_PDU_RX,
1852 "conn 0x%p, skb 0x%p, len %u, flag 0x%lx.\n",
1853 conn, skb, skb->len, cxgbi_skcb_flags(skb));
1854
1855 if (conn->datadgst_en &&
1856 cxgbi_skcb_test_flag(lskb, SKCBF_RX_DCRC_ERR)) {
1857 pr_info("conn 0x%p, skb 0x%p, dcrc 0x%lx.\n",
1858 conn, lskb, cxgbi_skcb_flags(lskb));
1859 iscsi_conn_failure(conn, ISCSI_ERR_DATA_DGST);
1860 return -EIO;
1861 }
1862
1863 if (iscsi_tcp_recv_segment_is_hdr(tcp_conn))
1864 return 0;
1865
1866 /* coalesced, add header digest length */
1867 if (lskb == skb && conn->hdrdgst_en)
1868 offset += ISCSI_DIGEST_SIZE;
1869
1870 if (cxgbi_skcb_test_flag(lskb, SKCBF_RX_DATA_DDPD))
1871 offloaded = 1;
1872
1873 if (opcode == ISCSI_OP_SCSI_DATA_IN)
1874 log_debug(1 << CXGBI_DBG_PDU_RX,
1875 "skb 0x%p, op 0x%x, itt 0x%x, %u %s ddp'ed.\n",
1876 skb, opcode, ntohl(tcp_conn->in.hdr->itt),
1877 tcp_conn->in.datalen, offloaded ? "is" : "not");
1878
1879 return read_pdu_skb(conn, skb, offset, offloaded);
1880 }
1881
1882 static void csk_return_rx_credits(struct cxgbi_sock *csk, int copied)
1883 {
1884 struct cxgbi_device *cdev = csk->cdev;
1885 int must_send;
1886 u32 credits;
1887
1888 log_debug(1 << CXGBI_DBG_PDU_RX,
1889 "csk 0x%p,%u,0x%lx,%u, seq %u, wup %u, thre %u, %u.\n",
1890 csk, csk->state, csk->flags, csk->tid, csk->copied_seq,
1891 csk->rcv_wup, cdev->rx_credit_thres,
1892 csk->rcv_win);
1893
1894 if (csk->state != CTP_ESTABLISHED)
1895 return;
1896
1897 credits = csk->copied_seq - csk->rcv_wup;
1898 if (unlikely(!credits))
1899 return;
1900 if (unlikely(cdev->rx_credit_thres == 0))
1901 return;
1902
1903 must_send = credits + 16384 >= csk->rcv_win;
1904 if (must_send || credits >= cdev->rx_credit_thres)
1905 csk->rcv_wup += cdev->csk_send_rx_credits(csk, credits);
1906 }
1907
1908 void cxgbi_conn_pdu_ready(struct cxgbi_sock *csk)
1909 {
1910 struct cxgbi_device *cdev = csk->cdev;
1911 struct iscsi_conn *conn = csk->user_data;
1912 struct sk_buff *skb;
1913 unsigned int read = 0;
1914 int err = 0;
1915
1916 log_debug(1 << CXGBI_DBG_PDU_RX,
1917 "csk 0x%p, conn 0x%p.\n", csk, conn);
1918
1919 if (unlikely(!conn || conn->suspend_rx)) {
1920 log_debug(1 << CXGBI_DBG_PDU_RX,
1921 "csk 0x%p, conn 0x%p, id %d, suspend_rx %lu!\n",
1922 csk, conn, conn ? conn->id : 0xFF,
1923 conn ? conn->suspend_rx : 0xFF);
1924 return;
1925 }
1926
1927 while (!err) {
1928 skb = skb_peek(&csk->receive_queue);
1929 if (!skb ||
1930 !(cxgbi_skcb_test_flag(skb, SKCBF_RX_STATUS))) {
1931 if (skb)
1932 log_debug(1 << CXGBI_DBG_PDU_RX,
1933 "skb 0x%p, NOT ready 0x%lx.\n",
1934 skb, cxgbi_skcb_flags(skb));
1935 break;
1936 }
1937 __skb_unlink(skb, &csk->receive_queue);
1938
1939 read += cxgbi_skcb_rx_pdulen(skb);
1940 log_debug(1 << CXGBI_DBG_PDU_RX,
1941 "csk 0x%p, skb 0x%p,%u,f 0x%lx, pdu len %u.\n",
1942 csk, skb, skb->len, cxgbi_skcb_flags(skb),
1943 cxgbi_skcb_rx_pdulen(skb));
1944
1945 if (cxgbi_skcb_test_flag(skb, SKCBF_RX_COALESCED)) {
1946 err = skb_read_pdu_bhs(conn, skb);
1947 if (err < 0) {
1948 pr_err("coalesced bhs, csk 0x%p, skb 0x%p,%u, "
1949 "f 0x%lx, plen %u.\n",
1950 csk, skb, skb->len,
1951 cxgbi_skcb_flags(skb),
1952 cxgbi_skcb_rx_pdulen(skb));
1953 goto skb_done;
1954 }
1955 err = skb_read_pdu_data(conn, skb, skb,
1956 err + cdev->skb_rx_extra);
1957 if (err < 0)
1958 pr_err("coalesced data, csk 0x%p, skb 0x%p,%u, "
1959 "f 0x%lx, plen %u.\n",
1960 csk, skb, skb->len,
1961 cxgbi_skcb_flags(skb),
1962 cxgbi_skcb_rx_pdulen(skb));
1963 } else {
1964 err = skb_read_pdu_bhs(conn, skb);
1965 if (err < 0) {
1966 pr_err("bhs, csk 0x%p, skb 0x%p,%u, "
1967 "f 0x%lx, plen %u.\n",
1968 csk, skb, skb->len,
1969 cxgbi_skcb_flags(skb),
1970 cxgbi_skcb_rx_pdulen(skb));
1971 goto skb_done;
1972 }
1973
1974 if (cxgbi_skcb_test_flag(skb, SKCBF_RX_DATA)) {
1975 struct sk_buff *dskb;
1976
1977 dskb = skb_peek(&csk->receive_queue);
1978 if (!dskb) {
1979 pr_err("csk 0x%p, skb 0x%p,%u, f 0x%lx,"
1980 " plen %u, NO data.\n",
1981 csk, skb, skb->len,
1982 cxgbi_skcb_flags(skb),
1983 cxgbi_skcb_rx_pdulen(skb));
1984 err = -EIO;
1985 goto skb_done;
1986 }
1987 __skb_unlink(dskb, &csk->receive_queue);
1988
1989 err = skb_read_pdu_data(conn, skb, dskb, 0);
1990 if (err < 0)
1991 pr_err("data, csk 0x%p, skb 0x%p,%u, "
1992 "f 0x%lx, plen %u, dskb 0x%p,"
1993 "%u.\n",
1994 csk, skb, skb->len,
1995 cxgbi_skcb_flags(skb),
1996 cxgbi_skcb_rx_pdulen(skb),
1997 dskb, dskb->len);
1998 __kfree_skb(dskb);
1999 } else
2000 err = skb_read_pdu_data(conn, skb, skb, 0);
2001 }
2002 skb_done:
2003 __kfree_skb(skb);
2004
2005 if (err < 0)
2006 break;
2007 }
2008
2009 log_debug(1 << CXGBI_DBG_PDU_RX, "csk 0x%p, read %u.\n", csk, read);
2010 if (read) {
2011 csk->copied_seq += read;
2012 csk_return_rx_credits(csk, read);
2013 conn->rxdata_octets += read;
2014 }
2015
2016 if (err < 0) {
2017 pr_info("csk 0x%p, 0x%p, rx failed %d, read %u.\n",
2018 csk, conn, err, read);
2019 iscsi_conn_failure(conn, ISCSI_ERR_CONN_FAILED);
2020 }
2021 }
2022 EXPORT_SYMBOL_GPL(cxgbi_conn_pdu_ready);
2023
2024 static int sgl_seek_offset(struct scatterlist *sgl, unsigned int sgcnt,
2025 unsigned int offset, unsigned int *off,
2026 struct scatterlist **sgp)
2027 {
2028 int i;
2029 struct scatterlist *sg;
2030
2031 for_each_sg(sgl, sg, sgcnt, i) {
2032 if (offset < sg->length) {
2033 *off = offset;
2034 *sgp = sg;
2035 return 0;
2036 }
2037 offset -= sg->length;
2038 }
2039 return -EFAULT;
2040 }
2041
2042 static int sgl_read_to_frags(struct scatterlist *sg, unsigned int sgoffset,
2043 unsigned int dlen, struct page_frag *frags,
2044 int frag_max)
2045 {
2046 unsigned int datalen = dlen;
2047 unsigned int sglen = sg->length - sgoffset;
2048 struct page *page = sg_page(sg);
2049 int i;
2050
2051 i = 0;
2052 do {
2053 unsigned int copy;
2054
2055 if (!sglen) {
2056 sg = sg_next(sg);
2057 if (!sg) {
2058 pr_warn("sg %d NULL, len %u/%u.\n",
2059 i, datalen, dlen);
2060 return -EINVAL;
2061 }
2062 sgoffset = 0;
2063 sglen = sg->length;
2064 page = sg_page(sg);
2065
2066 }
2067 copy = min(datalen, sglen);
2068 if (i && page == frags[i - 1].page &&
2069 sgoffset + sg->offset ==
2070 frags[i - 1].offset + frags[i - 1].size) {
2071 frags[i - 1].size += copy;
2072 } else {
2073 if (i >= frag_max) {
2074 pr_warn("too many pages %u, dlen %u.\n",
2075 frag_max, dlen);
2076 return -EINVAL;
2077 }
2078
2079 frags[i].page = page;
2080 frags[i].offset = sg->offset + sgoffset;
2081 frags[i].size = copy;
2082 i++;
2083 }
2084 datalen -= copy;
2085 sgoffset += copy;
2086 sglen -= copy;
2087 } while (datalen);
2088
2089 return i;
2090 }
2091
2092 int cxgbi_conn_alloc_pdu(struct iscsi_task *task, u8 opcode)
2093 {
2094 struct iscsi_tcp_conn *tcp_conn = task->conn->dd_data;
2095 struct cxgbi_conn *cconn = tcp_conn->dd_data;
2096 struct cxgbi_device *cdev = cconn->chba->cdev;
2097 struct iscsi_conn *conn = task->conn;
2098 struct iscsi_tcp_task *tcp_task = task->dd_data;
2099 struct cxgbi_task_data *tdata = iscsi_task_cxgbi_data(task);
2100 struct scsi_cmnd *sc = task->sc;
2101 int headroom = SKB_TX_ISCSI_PDU_HEADER_MAX;
2102
2103 tcp_task->dd_data = tdata;
2104 task->hdr = NULL;
2105
2106 if (SKB_MAX_HEAD(cdev->skb_tx_rsvd) > (512 * MAX_SKB_FRAGS) &&
2107 (opcode == ISCSI_OP_SCSI_DATA_OUT ||
2108 (opcode == ISCSI_OP_SCSI_CMD &&
2109 (scsi_bidi_cmnd(sc) || sc->sc_data_direction == DMA_TO_DEVICE))))
2110 /* data could goes into skb head */
2111 headroom += min_t(unsigned int,
2112 SKB_MAX_HEAD(cdev->skb_tx_rsvd),
2113 conn->max_xmit_dlength);
2114
2115 tdata->skb = alloc_skb(cdev->skb_tx_rsvd + headroom, GFP_ATOMIC);
2116 if (!tdata->skb) {
2117 struct cxgbi_sock *csk = cconn->cep->csk;
2118 struct net_device *ndev = cdev->ports[csk->port_id];
2119 ndev->stats.tx_dropped++;
2120 return -ENOMEM;
2121 }
2122
2123 skb_reserve(tdata->skb, cdev->skb_tx_rsvd);
2124 task->hdr = (struct iscsi_hdr *)tdata->skb->data;
2125 task->hdr_max = SKB_TX_ISCSI_PDU_HEADER_MAX; /* BHS + AHS */
2126
2127 /* data_out uses scsi_cmd's itt */
2128 if (opcode != ISCSI_OP_SCSI_DATA_OUT)
2129 task_reserve_itt(task, &task->hdr->itt);
2130
2131 log_debug(1 << CXGBI_DBG_ISCSI | 1 << CXGBI_DBG_PDU_TX,
2132 "task 0x%p, op 0x%x, skb 0x%p,%u+%u/%u, itt 0x%x.\n",
2133 task, opcode, tdata->skb, cdev->skb_tx_rsvd, headroom,
2134 conn->max_xmit_dlength, ntohl(task->hdr->itt));
2135
2136 return 0;
2137 }
2138 EXPORT_SYMBOL_GPL(cxgbi_conn_alloc_pdu);
2139
2140 static inline void tx_skb_setmode(struct sk_buff *skb, int hcrc, int dcrc)
2141 {
2142 if (hcrc || dcrc) {
2143 u8 submode = 0;
2144
2145 if (hcrc)
2146 submode |= 1;
2147 if (dcrc)
2148 submode |= 2;
2149 cxgbi_skcb_ulp_mode(skb) = (ULP2_MODE_ISCSI << 4) | submode;
2150 } else
2151 cxgbi_skcb_ulp_mode(skb) = 0;
2152 }
2153
2154 int cxgbi_conn_init_pdu(struct iscsi_task *task, unsigned int offset,
2155 unsigned int count)
2156 {
2157 struct iscsi_conn *conn = task->conn;
2158 struct cxgbi_task_data *tdata = iscsi_task_cxgbi_data(task);
2159 struct sk_buff *skb = tdata->skb;
2160 unsigned int datalen = count;
2161 int i, padlen = iscsi_padding(count);
2162 struct page *pg;
2163
2164 log_debug(1 << CXGBI_DBG_ISCSI | 1 << CXGBI_DBG_PDU_TX,
2165 "task 0x%p,0x%p, skb 0x%p, 0x%x,0x%x,0x%x, %u+%u.\n",
2166 task, task->sc, skb, (*skb->data) & ISCSI_OPCODE_MASK,
2167 ntohl(task->cmdsn), ntohl(task->hdr->itt), offset, count);
2168
2169 skb_put(skb, task->hdr_len);
2170 tx_skb_setmode(skb, conn->hdrdgst_en, datalen ? conn->datadgst_en : 0);
2171 if (!count)
2172 return 0;
2173
2174 if (task->sc) {
2175 struct scsi_data_buffer *sdb = scsi_out(task->sc);
2176 struct scatterlist *sg = NULL;
2177 int err;
2178
2179 tdata->offset = offset;
2180 tdata->count = count;
2181 err = sgl_seek_offset(
2182 sdb->table.sgl, sdb->table.nents,
2183 tdata->offset, &tdata->sgoffset, &sg);
2184 if (err < 0) {
2185 pr_warn("tpdu, sgl %u, bad offset %u/%u.\n",
2186 sdb->table.nents, tdata->offset, sdb->length);
2187 return err;
2188 }
2189 err = sgl_read_to_frags(sg, tdata->sgoffset, tdata->count,
2190 tdata->frags, MAX_PDU_FRAGS);
2191 if (err < 0) {
2192 pr_warn("tpdu, sgl %u, bad offset %u + %u.\n",
2193 sdb->table.nents, tdata->offset, tdata->count);
2194 return err;
2195 }
2196 tdata->nr_frags = err;
2197
2198 if (tdata->nr_frags > MAX_SKB_FRAGS ||
2199 (padlen && tdata->nr_frags == MAX_SKB_FRAGS)) {
2200 char *dst = skb->data + task->hdr_len;
2201 struct page_frag *frag = tdata->frags;
2202
2203 /* data fits in the skb's headroom */
2204 for (i = 0; i < tdata->nr_frags; i++, frag++) {
2205 char *src = kmap_atomic(frag->page);
2206
2207 memcpy(dst, src+frag->offset, frag->size);
2208 dst += frag->size;
2209 kunmap_atomic(src);
2210 }
2211 if (padlen) {
2212 memset(dst, 0, padlen);
2213 padlen = 0;
2214 }
2215 skb_put(skb, count + padlen);
2216 } else {
2217 /* data fit into frag_list */
2218 for (i = 0; i < tdata->nr_frags; i++) {
2219 __skb_fill_page_desc(skb, i,
2220 tdata->frags[i].page,
2221 tdata->frags[i].offset,
2222 tdata->frags[i].size);
2223 skb_frag_ref(skb, i);
2224 }
2225 skb_shinfo(skb)->nr_frags = tdata->nr_frags;
2226 skb->len += count;
2227 skb->data_len += count;
2228 skb->truesize += count;
2229 }
2230
2231 } else {
2232 pg = virt_to_page(task->data);
2233
2234 get_page(pg);
2235 skb_fill_page_desc(skb, 0, pg, offset_in_page(task->data),
2236 count);
2237 skb->len += count;
2238 skb->data_len += count;
2239 skb->truesize += count;
2240 }
2241
2242 if (padlen) {
2243 i = skb_shinfo(skb)->nr_frags;
2244 skb_fill_page_desc(skb, skb_shinfo(skb)->nr_frags,
2245 virt_to_page(padding), offset_in_page(padding),
2246 padlen);
2247
2248 skb->data_len += padlen;
2249 skb->truesize += padlen;
2250 skb->len += padlen;
2251 }
2252
2253 return 0;
2254 }
2255 EXPORT_SYMBOL_GPL(cxgbi_conn_init_pdu);
2256
2257 int cxgbi_conn_xmit_pdu(struct iscsi_task *task)
2258 {
2259 struct iscsi_tcp_conn *tcp_conn = task->conn->dd_data;
2260 struct cxgbi_conn *cconn = tcp_conn->dd_data;
2261 struct cxgbi_task_data *tdata = iscsi_task_cxgbi_data(task);
2262 struct sk_buff *skb = tdata->skb;
2263 unsigned int datalen;
2264 int err;
2265
2266 if (!skb) {
2267 log_debug(1 << CXGBI_DBG_ISCSI | 1 << CXGBI_DBG_PDU_TX,
2268 "task 0x%p, skb NULL.\n", task);
2269 return 0;
2270 }
2271
2272 datalen = skb->data_len;
2273 tdata->skb = NULL;
2274 err = cxgbi_sock_send_pdus(cconn->cep->csk, skb);
2275 if (err > 0) {
2276 int pdulen = err;
2277
2278 log_debug(1 << CXGBI_DBG_PDU_TX,
2279 "task 0x%p,0x%p, skb 0x%p, len %u/%u, rv %d.\n",
2280 task, task->sc, skb, skb->len, skb->data_len, err);
2281
2282 if (task->conn->hdrdgst_en)
2283 pdulen += ISCSI_DIGEST_SIZE;
2284
2285 if (datalen && task->conn->datadgst_en)
2286 pdulen += ISCSI_DIGEST_SIZE;
2287
2288 task->conn->txdata_octets += pdulen;
2289 return 0;
2290 }
2291
2292 if (err == -EAGAIN || err == -ENOBUFS) {
2293 log_debug(1 << CXGBI_DBG_PDU_TX,
2294 "task 0x%p, skb 0x%p, len %u/%u, %d EAGAIN.\n",
2295 task, skb, skb->len, skb->data_len, err);
2296 /* reset skb to send when we are called again */
2297 tdata->skb = skb;
2298 return err;
2299 }
2300
2301 log_debug(1 << CXGBI_DBG_ISCSI | 1 << CXGBI_DBG_PDU_TX,
2302 "itt 0x%x, skb 0x%p, len %u/%u, xmit err %d.\n",
2303 task->itt, skb, skb->len, skb->data_len, err);
2304
2305 kfree_skb(skb);
2306
2307 iscsi_conn_printk(KERN_ERR, task->conn, "xmit err %d.\n", err);
2308 iscsi_conn_failure(task->conn, ISCSI_ERR_XMIT_FAILED);
2309 return err;
2310 }
2311 EXPORT_SYMBOL_GPL(cxgbi_conn_xmit_pdu);
2312
2313 void cxgbi_cleanup_task(struct iscsi_task *task)
2314 {
2315 struct cxgbi_task_data *tdata = iscsi_task_cxgbi_data(task);
2316
2317 log_debug(1 << CXGBI_DBG_ISCSI,
2318 "task 0x%p, skb 0x%p, itt 0x%x.\n",
2319 task, tdata->skb, task->hdr_itt);
2320
2321 /* never reached the xmit task callout */
2322 if (tdata->skb)
2323 __kfree_skb(tdata->skb);
2324 memset(tdata, 0, sizeof(*tdata));
2325
2326 task_release_itt(task, task->hdr_itt);
2327 iscsi_tcp_cleanup_task(task);
2328 }
2329 EXPORT_SYMBOL_GPL(cxgbi_cleanup_task);
2330
2331 void cxgbi_get_conn_stats(struct iscsi_cls_conn *cls_conn,
2332 struct iscsi_stats *stats)
2333 {
2334 struct iscsi_conn *conn = cls_conn->dd_data;
2335
2336 stats->txdata_octets = conn->txdata_octets;
2337 stats->rxdata_octets = conn->rxdata_octets;
2338 stats->scsicmd_pdus = conn->scsicmd_pdus_cnt;
2339 stats->dataout_pdus = conn->dataout_pdus_cnt;
2340 stats->scsirsp_pdus = conn->scsirsp_pdus_cnt;
2341 stats->datain_pdus = conn->datain_pdus_cnt;
2342 stats->r2t_pdus = conn->r2t_pdus_cnt;
2343 stats->tmfcmd_pdus = conn->tmfcmd_pdus_cnt;
2344 stats->tmfrsp_pdus = conn->tmfrsp_pdus_cnt;
2345 stats->digest_err = 0;
2346 stats->timeout_err = 0;
2347 stats->custom_length = 1;
2348 strcpy(stats->custom[0].desc, "eh_abort_cnt");
2349 stats->custom[0].value = conn->eh_abort_cnt;
2350 }
2351 EXPORT_SYMBOL_GPL(cxgbi_get_conn_stats);
2352
2353 static int cxgbi_conn_max_xmit_dlength(struct iscsi_conn *conn)
2354 {
2355 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
2356 struct cxgbi_conn *cconn = tcp_conn->dd_data;
2357 struct cxgbi_device *cdev = cconn->chba->cdev;
2358 unsigned int headroom = SKB_MAX_HEAD(cdev->skb_tx_rsvd);
2359 unsigned int max_def = 512 * MAX_SKB_FRAGS;
2360 unsigned int max = max(max_def, headroom);
2361
2362 max = min(cconn->chba->cdev->tx_max_size, max);
2363 if (conn->max_xmit_dlength)
2364 conn->max_xmit_dlength = min(conn->max_xmit_dlength, max);
2365 else
2366 conn->max_xmit_dlength = max;
2367 cxgbi_align_pdu_size(conn->max_xmit_dlength);
2368
2369 return 0;
2370 }
2371
2372 static int cxgbi_conn_max_recv_dlength(struct iscsi_conn *conn)
2373 {
2374 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
2375 struct cxgbi_conn *cconn = tcp_conn->dd_data;
2376 unsigned int max = cconn->chba->cdev->rx_max_size;
2377
2378 cxgbi_align_pdu_size(max);
2379
2380 if (conn->max_recv_dlength) {
2381 if (conn->max_recv_dlength > max) {
2382 pr_err("MaxRecvDataSegmentLength %u > %u.\n",
2383 conn->max_recv_dlength, max);
2384 return -EINVAL;
2385 }
2386 conn->max_recv_dlength = min(conn->max_recv_dlength, max);
2387 cxgbi_align_pdu_size(conn->max_recv_dlength);
2388 } else
2389 conn->max_recv_dlength = max;
2390
2391 return 0;
2392 }
2393
2394 int cxgbi_set_conn_param(struct iscsi_cls_conn *cls_conn,
2395 enum iscsi_param param, char *buf, int buflen)
2396 {
2397 struct iscsi_conn *conn = cls_conn->dd_data;
2398 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
2399 struct cxgbi_conn *cconn = tcp_conn->dd_data;
2400 struct cxgbi_sock *csk = cconn->cep->csk;
2401 int err;
2402
2403 log_debug(1 << CXGBI_DBG_ISCSI,
2404 "cls_conn 0x%p, param %d, buf(%d) %s.\n",
2405 cls_conn, param, buflen, buf);
2406
2407 switch (param) {
2408 case ISCSI_PARAM_HDRDGST_EN:
2409 err = iscsi_set_param(cls_conn, param, buf, buflen);
2410 if (!err && conn->hdrdgst_en)
2411 err = csk->cdev->csk_ddp_setup_digest(csk, csk->tid,
2412 conn->hdrdgst_en,
2413 conn->datadgst_en, 0);
2414 break;
2415 case ISCSI_PARAM_DATADGST_EN:
2416 err = iscsi_set_param(cls_conn, param, buf, buflen);
2417 if (!err && conn->datadgst_en)
2418 err = csk->cdev->csk_ddp_setup_digest(csk, csk->tid,
2419 conn->hdrdgst_en,
2420 conn->datadgst_en, 0);
2421 break;
2422 case ISCSI_PARAM_MAX_R2T:
2423 return iscsi_tcp_set_max_r2t(conn, buf);
2424 case ISCSI_PARAM_MAX_RECV_DLENGTH:
2425 err = iscsi_set_param(cls_conn, param, buf, buflen);
2426 if (!err)
2427 err = cxgbi_conn_max_recv_dlength(conn);
2428 break;
2429 case ISCSI_PARAM_MAX_XMIT_DLENGTH:
2430 err = iscsi_set_param(cls_conn, param, buf, buflen);
2431 if (!err)
2432 err = cxgbi_conn_max_xmit_dlength(conn);
2433 break;
2434 default:
2435 return iscsi_set_param(cls_conn, param, buf, buflen);
2436 }
2437 return err;
2438 }
2439 EXPORT_SYMBOL_GPL(cxgbi_set_conn_param);
2440
2441 static inline int csk_print_port(struct cxgbi_sock *csk, char *buf)
2442 {
2443 int len;
2444
2445 cxgbi_sock_get(csk);
2446 len = sprintf(buf, "%hu\n", ntohs(csk->daddr.sin_port));
2447 cxgbi_sock_put(csk);
2448
2449 return len;
2450 }
2451
2452 static inline int csk_print_ip(struct cxgbi_sock *csk, char *buf)
2453 {
2454 int len;
2455
2456 cxgbi_sock_get(csk);
2457 if (csk->csk_family == AF_INET)
2458 len = sprintf(buf, "%pI4",
2459 &csk->daddr.sin_addr.s_addr);
2460 else
2461 len = sprintf(buf, "%pI6",
2462 &csk->daddr6.sin6_addr);
2463
2464 cxgbi_sock_put(csk);
2465
2466 return len;
2467 }
2468
2469 int cxgbi_get_ep_param(struct iscsi_endpoint *ep, enum iscsi_param param,
2470 char *buf)
2471 {
2472 struct cxgbi_endpoint *cep = ep->dd_data;
2473 struct cxgbi_sock *csk;
2474 int len;
2475
2476 log_debug(1 << CXGBI_DBG_ISCSI,
2477 "cls_conn 0x%p, param %d.\n", ep, param);
2478
2479 switch (param) {
2480 case ISCSI_PARAM_CONN_PORT:
2481 case ISCSI_PARAM_CONN_ADDRESS:
2482 if (!cep)
2483 return -ENOTCONN;
2484
2485 csk = cep->csk;
2486 if (!csk)
2487 return -ENOTCONN;
2488
2489 return iscsi_conn_get_addr_param((struct sockaddr_storage *)
2490 &csk->daddr, param, buf);
2491 default:
2492 return -ENOSYS;
2493 }
2494 return len;
2495 }
2496 EXPORT_SYMBOL_GPL(cxgbi_get_ep_param);
2497
2498 struct iscsi_cls_conn *
2499 cxgbi_create_conn(struct iscsi_cls_session *cls_session, u32 cid)
2500 {
2501 struct iscsi_cls_conn *cls_conn;
2502 struct iscsi_conn *conn;
2503 struct iscsi_tcp_conn *tcp_conn;
2504 struct cxgbi_conn *cconn;
2505
2506 cls_conn = iscsi_tcp_conn_setup(cls_session, sizeof(*cconn), cid);
2507 if (!cls_conn)
2508 return NULL;
2509
2510 conn = cls_conn->dd_data;
2511 tcp_conn = conn->dd_data;
2512 cconn = tcp_conn->dd_data;
2513 cconn->iconn = conn;
2514
2515 log_debug(1 << CXGBI_DBG_ISCSI,
2516 "cid %u(0x%x), cls 0x%p,0x%p, conn 0x%p,0x%p,0x%p.\n",
2517 cid, cid, cls_session, cls_conn, conn, tcp_conn, cconn);
2518
2519 return cls_conn;
2520 }
2521 EXPORT_SYMBOL_GPL(cxgbi_create_conn);
2522
2523 int cxgbi_bind_conn(struct iscsi_cls_session *cls_session,
2524 struct iscsi_cls_conn *cls_conn,
2525 u64 transport_eph, int is_leading)
2526 {
2527 struct iscsi_conn *conn = cls_conn->dd_data;
2528 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
2529 struct cxgbi_conn *cconn = tcp_conn->dd_data;
2530 struct iscsi_endpoint *ep;
2531 struct cxgbi_endpoint *cep;
2532 struct cxgbi_sock *csk;
2533 int err;
2534
2535 ep = iscsi_lookup_endpoint(transport_eph);
2536 if (!ep)
2537 return -EINVAL;
2538
2539 /* setup ddp pagesize */
2540 cep = ep->dd_data;
2541 csk = cep->csk;
2542 err = csk->cdev->csk_ddp_setup_pgidx(csk, csk->tid, page_idx, 0);
2543 if (err < 0)
2544 return err;
2545
2546 err = iscsi_conn_bind(cls_session, cls_conn, is_leading);
2547 if (err)
2548 return -EINVAL;
2549
2550 /* calculate the tag idx bits needed for this conn based on cmds_max */
2551 cconn->task_idx_bits = (__ilog2_u32(conn->session->cmds_max - 1)) + 1;
2552
2553 write_lock_bh(&csk->callback_lock);
2554 csk->user_data = conn;
2555 cconn->chba = cep->chba;
2556 cconn->cep = cep;
2557 cep->cconn = cconn;
2558 write_unlock_bh(&csk->callback_lock);
2559
2560 cxgbi_conn_max_xmit_dlength(conn);
2561 cxgbi_conn_max_recv_dlength(conn);
2562
2563 log_debug(1 << CXGBI_DBG_ISCSI,
2564 "cls 0x%p,0x%p, ep 0x%p, cconn 0x%p, csk 0x%p.\n",
2565 cls_session, cls_conn, ep, cconn, csk);
2566 /* init recv engine */
2567 iscsi_tcp_hdr_recv_prep(tcp_conn);
2568
2569 return 0;
2570 }
2571 EXPORT_SYMBOL_GPL(cxgbi_bind_conn);
2572
2573 struct iscsi_cls_session *cxgbi_create_session(struct iscsi_endpoint *ep,
2574 u16 cmds_max, u16 qdepth,
2575 u32 initial_cmdsn)
2576 {
2577 struct cxgbi_endpoint *cep;
2578 struct cxgbi_hba *chba;
2579 struct Scsi_Host *shost;
2580 struct iscsi_cls_session *cls_session;
2581 struct iscsi_session *session;
2582
2583 if (!ep) {
2584 pr_err("missing endpoint.\n");
2585 return NULL;
2586 }
2587
2588 cep = ep->dd_data;
2589 chba = cep->chba;
2590 shost = chba->shost;
2591
2592 BUG_ON(chba != iscsi_host_priv(shost));
2593
2594 cls_session = iscsi_session_setup(chba->cdev->itp, shost,
2595 cmds_max, 0,
2596 sizeof(struct iscsi_tcp_task) +
2597 sizeof(struct cxgbi_task_data),
2598 initial_cmdsn, ISCSI_MAX_TARGET);
2599 if (!cls_session)
2600 return NULL;
2601
2602 session = cls_session->dd_data;
2603 if (iscsi_tcp_r2tpool_alloc(session))
2604 goto remove_session;
2605
2606 log_debug(1 << CXGBI_DBG_ISCSI,
2607 "ep 0x%p, cls sess 0x%p.\n", ep, cls_session);
2608 return cls_session;
2609
2610 remove_session:
2611 iscsi_session_teardown(cls_session);
2612 return NULL;
2613 }
2614 EXPORT_SYMBOL_GPL(cxgbi_create_session);
2615
2616 void cxgbi_destroy_session(struct iscsi_cls_session *cls_session)
2617 {
2618 log_debug(1 << CXGBI_DBG_ISCSI,
2619 "cls sess 0x%p.\n", cls_session);
2620
2621 iscsi_tcp_r2tpool_free(cls_session->dd_data);
2622 iscsi_session_teardown(cls_session);
2623 }
2624 EXPORT_SYMBOL_GPL(cxgbi_destroy_session);
2625
2626 int cxgbi_set_host_param(struct Scsi_Host *shost, enum iscsi_host_param param,
2627 char *buf, int buflen)
2628 {
2629 struct cxgbi_hba *chba = iscsi_host_priv(shost);
2630
2631 if (!chba->ndev) {
2632 shost_printk(KERN_ERR, shost, "Could not get host param. "
2633 "netdev for host not set.\n");
2634 return -ENODEV;
2635 }
2636
2637 log_debug(1 << CXGBI_DBG_ISCSI,
2638 "shost 0x%p, hba 0x%p,%s, param %d, buf(%d) %s.\n",
2639 shost, chba, chba->ndev->name, param, buflen, buf);
2640
2641 switch (param) {
2642 case ISCSI_HOST_PARAM_IPADDRESS:
2643 {
2644 __be32 addr = in_aton(buf);
2645 log_debug(1 << CXGBI_DBG_ISCSI,
2646 "hba %s, req. ipv4 %pI4.\n", chba->ndev->name, &addr);
2647 cxgbi_set_iscsi_ipv4(chba, addr);
2648 return 0;
2649 }
2650 case ISCSI_HOST_PARAM_HWADDRESS:
2651 case ISCSI_HOST_PARAM_NETDEV_NAME:
2652 return 0;
2653 default:
2654 return iscsi_host_set_param(shost, param, buf, buflen);
2655 }
2656 }
2657 EXPORT_SYMBOL_GPL(cxgbi_set_host_param);
2658
2659 int cxgbi_get_host_param(struct Scsi_Host *shost, enum iscsi_host_param param,
2660 char *buf)
2661 {
2662 struct cxgbi_hba *chba = iscsi_host_priv(shost);
2663 int len = 0;
2664
2665 if (!chba->ndev) {
2666 shost_printk(KERN_ERR, shost, "Could not get host param. "
2667 "netdev for host not set.\n");
2668 return -ENODEV;
2669 }
2670
2671 log_debug(1 << CXGBI_DBG_ISCSI,
2672 "shost 0x%p, hba 0x%p,%s, param %d.\n",
2673 shost, chba, chba->ndev->name, param);
2674
2675 switch (param) {
2676 case ISCSI_HOST_PARAM_HWADDRESS:
2677 len = sysfs_format_mac(buf, chba->ndev->dev_addr, 6);
2678 break;
2679 case ISCSI_HOST_PARAM_NETDEV_NAME:
2680 len = sprintf(buf, "%s\n", chba->ndev->name);
2681 break;
2682 case ISCSI_HOST_PARAM_IPADDRESS:
2683 {
2684 struct cxgbi_sock *csk = find_sock_on_port(chba->cdev,
2685 chba->port_id);
2686 if (csk) {
2687 len = sprintf(buf, "%pIS",
2688 (struct sockaddr *)&csk->saddr);
2689 }
2690 log_debug(1 << CXGBI_DBG_ISCSI,
2691 "hba %s, addr %s.\n", chba->ndev->name, buf);
2692 break;
2693 }
2694 default:
2695 return iscsi_host_get_param(shost, param, buf);
2696 }
2697
2698 return len;
2699 }
2700 EXPORT_SYMBOL_GPL(cxgbi_get_host_param);
2701
2702 struct iscsi_endpoint *cxgbi_ep_connect(struct Scsi_Host *shost,
2703 struct sockaddr *dst_addr,
2704 int non_blocking)
2705 {
2706 struct iscsi_endpoint *ep;
2707 struct cxgbi_endpoint *cep;
2708 struct cxgbi_hba *hba = NULL;
2709 struct cxgbi_sock *csk;
2710 int err = -EINVAL;
2711
2712 log_debug(1 << CXGBI_DBG_ISCSI | 1 << CXGBI_DBG_SOCK,
2713 "shost 0x%p, non_blocking %d, dst_addr 0x%p.\n",
2714 shost, non_blocking, dst_addr);
2715
2716 if (shost) {
2717 hba = iscsi_host_priv(shost);
2718 if (!hba) {
2719 pr_info("shost 0x%p, priv NULL.\n", shost);
2720 goto err_out;
2721 }
2722 }
2723
2724 if (dst_addr->sa_family == AF_INET) {
2725 csk = cxgbi_check_route(dst_addr);
2726 #if IS_ENABLED(CONFIG_IPV6)
2727 } else if (dst_addr->sa_family == AF_INET6) {
2728 csk = cxgbi_check_route6(dst_addr);
2729 #endif
2730 } else {
2731 pr_info("address family 0x%x NOT supported.\n",
2732 dst_addr->sa_family);
2733 err = -EAFNOSUPPORT;
2734 return (struct iscsi_endpoint *)ERR_PTR(err);
2735 }
2736
2737 if (IS_ERR(csk))
2738 return (struct iscsi_endpoint *)csk;
2739 cxgbi_sock_get(csk);
2740
2741 if (!hba)
2742 hba = csk->cdev->hbas[csk->port_id];
2743 else if (hba != csk->cdev->hbas[csk->port_id]) {
2744 pr_info("Could not connect through requested host %u"
2745 "hba 0x%p != 0x%p (%u).\n",
2746 shost->host_no, hba,
2747 csk->cdev->hbas[csk->port_id], csk->port_id);
2748 err = -ENOSPC;
2749 goto release_conn;
2750 }
2751
2752 err = sock_get_port(csk);
2753 if (err)
2754 goto release_conn;
2755
2756 cxgbi_sock_set_state(csk, CTP_CONNECTING);
2757 err = csk->cdev->csk_init_act_open(csk);
2758 if (err)
2759 goto release_conn;
2760
2761 if (cxgbi_sock_is_closing(csk)) {
2762 err = -ENOSPC;
2763 pr_info("csk 0x%p is closing.\n", csk);
2764 goto release_conn;
2765 }
2766
2767 ep = iscsi_create_endpoint(sizeof(*cep));
2768 if (!ep) {
2769 err = -ENOMEM;
2770 pr_info("iscsi alloc ep, OOM.\n");
2771 goto release_conn;
2772 }
2773
2774 cep = ep->dd_data;
2775 cep->csk = csk;
2776 cep->chba = hba;
2777
2778 log_debug(1 << CXGBI_DBG_ISCSI | 1 << CXGBI_DBG_SOCK,
2779 "ep 0x%p, cep 0x%p, csk 0x%p, hba 0x%p,%s.\n",
2780 ep, cep, csk, hba, hba->ndev->name);
2781 return ep;
2782
2783 release_conn:
2784 cxgbi_sock_put(csk);
2785 cxgbi_sock_closed(csk);
2786 err_out:
2787 return ERR_PTR(err);
2788 }
2789 EXPORT_SYMBOL_GPL(cxgbi_ep_connect);
2790
2791 int cxgbi_ep_poll(struct iscsi_endpoint *ep, int timeout_ms)
2792 {
2793 struct cxgbi_endpoint *cep = ep->dd_data;
2794 struct cxgbi_sock *csk = cep->csk;
2795
2796 if (!cxgbi_sock_is_established(csk))
2797 return 0;
2798 return 1;
2799 }
2800 EXPORT_SYMBOL_GPL(cxgbi_ep_poll);
2801
2802 void cxgbi_ep_disconnect(struct iscsi_endpoint *ep)
2803 {
2804 struct cxgbi_endpoint *cep = ep->dd_data;
2805 struct cxgbi_conn *cconn = cep->cconn;
2806 struct cxgbi_sock *csk = cep->csk;
2807
2808 log_debug(1 << CXGBI_DBG_ISCSI | 1 << CXGBI_DBG_SOCK,
2809 "ep 0x%p, cep 0x%p, cconn 0x%p, csk 0x%p,%u,0x%lx.\n",
2810 ep, cep, cconn, csk, csk->state, csk->flags);
2811
2812 if (cconn && cconn->iconn) {
2813 iscsi_suspend_tx(cconn->iconn);
2814 write_lock_bh(&csk->callback_lock);
2815 cep->csk->user_data = NULL;
2816 cconn->cep = NULL;
2817 write_unlock_bh(&csk->callback_lock);
2818 }
2819 iscsi_destroy_endpoint(ep);
2820
2821 if (likely(csk->state >= CTP_ESTABLISHED))
2822 need_active_close(csk);
2823 else
2824 cxgbi_sock_closed(csk);
2825
2826 cxgbi_sock_put(csk);
2827 }
2828 EXPORT_SYMBOL_GPL(cxgbi_ep_disconnect);
2829
2830 int cxgbi_iscsi_init(struct iscsi_transport *itp,
2831 struct scsi_transport_template **stt)
2832 {
2833 *stt = iscsi_register_transport(itp);
2834 if (*stt == NULL) {
2835 pr_err("unable to register %s transport 0x%p.\n",
2836 itp->name, itp);
2837 return -ENODEV;
2838 }
2839 log_debug(1 << CXGBI_DBG_ISCSI,
2840 "%s, registered iscsi transport 0x%p.\n",
2841 itp->name, stt);
2842 return 0;
2843 }
2844 EXPORT_SYMBOL_GPL(cxgbi_iscsi_init);
2845
2846 void cxgbi_iscsi_cleanup(struct iscsi_transport *itp,
2847 struct scsi_transport_template **stt)
2848 {
2849 if (*stt) {
2850 log_debug(1 << CXGBI_DBG_ISCSI,
2851 "de-register transport 0x%p, %s, stt 0x%p.\n",
2852 itp, itp->name, *stt);
2853 *stt = NULL;
2854 iscsi_unregister_transport(itp);
2855 }
2856 }
2857 EXPORT_SYMBOL_GPL(cxgbi_iscsi_cleanup);
2858
2859 umode_t cxgbi_attr_is_visible(int param_type, int param)
2860 {
2861 switch (param_type) {
2862 case ISCSI_HOST_PARAM:
2863 switch (param) {
2864 case ISCSI_HOST_PARAM_NETDEV_NAME:
2865 case ISCSI_HOST_PARAM_HWADDRESS:
2866 case ISCSI_HOST_PARAM_IPADDRESS:
2867 case ISCSI_HOST_PARAM_INITIATOR_NAME:
2868 return S_IRUGO;
2869 default:
2870 return 0;
2871 }
2872 case ISCSI_PARAM:
2873 switch (param) {
2874 case ISCSI_PARAM_MAX_RECV_DLENGTH:
2875 case ISCSI_PARAM_MAX_XMIT_DLENGTH:
2876 case ISCSI_PARAM_HDRDGST_EN:
2877 case ISCSI_PARAM_DATADGST_EN:
2878 case ISCSI_PARAM_CONN_ADDRESS:
2879 case ISCSI_PARAM_CONN_PORT:
2880 case ISCSI_PARAM_EXP_STATSN:
2881 case ISCSI_PARAM_PERSISTENT_ADDRESS:
2882 case ISCSI_PARAM_PERSISTENT_PORT:
2883 case ISCSI_PARAM_PING_TMO:
2884 case ISCSI_PARAM_RECV_TMO:
2885 case ISCSI_PARAM_INITIAL_R2T_EN:
2886 case ISCSI_PARAM_MAX_R2T:
2887 case ISCSI_PARAM_IMM_DATA_EN:
2888 case ISCSI_PARAM_FIRST_BURST:
2889 case ISCSI_PARAM_MAX_BURST:
2890 case ISCSI_PARAM_PDU_INORDER_EN:
2891 case ISCSI_PARAM_DATASEQ_INORDER_EN:
2892 case ISCSI_PARAM_ERL:
2893 case ISCSI_PARAM_TARGET_NAME:
2894 case ISCSI_PARAM_TPGT:
2895 case ISCSI_PARAM_USERNAME:
2896 case ISCSI_PARAM_PASSWORD:
2897 case ISCSI_PARAM_USERNAME_IN:
2898 case ISCSI_PARAM_PASSWORD_IN:
2899 case ISCSI_PARAM_FAST_ABORT:
2900 case ISCSI_PARAM_ABORT_TMO:
2901 case ISCSI_PARAM_LU_RESET_TMO:
2902 case ISCSI_PARAM_TGT_RESET_TMO:
2903 case ISCSI_PARAM_IFACE_NAME:
2904 case ISCSI_PARAM_INITIATOR_NAME:
2905 return S_IRUGO;
2906 default:
2907 return 0;
2908 }
2909 }
2910
2911 return 0;
2912 }
2913 EXPORT_SYMBOL_GPL(cxgbi_attr_is_visible);
2914
2915 static int __init libcxgbi_init_module(void)
2916 {
2917 sw_tag_idx_bits = (__ilog2_u32(ISCSI_ITT_MASK)) + 1;
2918 sw_tag_age_bits = (__ilog2_u32(ISCSI_AGE_MASK)) + 1;
2919
2920 pr_info("%s", version);
2921
2922 pr_info("tag itt 0x%x, %u bits, age 0x%x, %u bits.\n",
2923 ISCSI_ITT_MASK, sw_tag_idx_bits,
2924 ISCSI_AGE_MASK, sw_tag_age_bits);
2925
2926 ddp_setup_host_page_size();
2927 return 0;
2928 }
2929
2930 static void __exit libcxgbi_exit_module(void)
2931 {
2932 cxgbi_device_unregister_all(0xFF);
2933 return;
2934 }
2935
2936 module_init(libcxgbi_init_module);
2937 module_exit(libcxgbi_exit_module);
This page took 0.12157 seconds and 6 git commands to generate.