[SCSI] iscsi_tcp, libiscsi: initial AHS Support
[deliverable/linux.git] / drivers / scsi / iscsi_tcp.c
1 /*
2 * iSCSI Initiator over TCP/IP Data-Path
3 *
4 * Copyright (C) 2004 Dmitry Yusupov
5 * Copyright (C) 2004 Alex Aizman
6 * Copyright (C) 2005 - 2006 Mike Christie
7 * Copyright (C) 2006 Red Hat, Inc. All rights reserved.
8 * maintained by open-iscsi@googlegroups.com
9 *
10 * This program is free software; you can redistribute it and/or modify
11 * it under the terms of the GNU General Public License as published
12 * by the Free Software Foundation; either version 2 of the License, or
13 * (at your option) any later version.
14 *
15 * This program is distributed in the hope that it will be useful, but
16 * WITHOUT ANY WARRANTY; without even the implied warranty of
17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 * General Public License for more details.
19 *
20 * See the file COPYING included with this distribution for more details.
21 *
22 * Credits:
23 * Christoph Hellwig
24 * FUJITA Tomonori
25 * Arne Redlich
26 * Zhenyu Wang
27 */
28
29 #include <linux/types.h>
30 #include <linux/list.h>
31 #include <linux/inet.h>
32 #include <linux/file.h>
33 #include <linux/blkdev.h>
34 #include <linux/crypto.h>
35 #include <linux/delay.h>
36 #include <linux/kfifo.h>
37 #include <linux/scatterlist.h>
38 #include <net/tcp.h>
39 #include <scsi/scsi_cmnd.h>
40 #include <scsi/scsi_device.h>
41 #include <scsi/scsi_host.h>
42 #include <scsi/scsi.h>
43 #include <scsi/scsi_transport_iscsi.h>
44
45 #include "iscsi_tcp.h"
46
47 MODULE_AUTHOR("Dmitry Yusupov <dmitry_yus@yahoo.com>, "
48 "Alex Aizman <itn780@yahoo.com>");
49 MODULE_DESCRIPTION("iSCSI/TCP data-path");
50 MODULE_LICENSE("GPL");
/*
 * Compile-time debug switches.
 *
 * DEBUG_TCP is left undefined, so debug_tcp() expands to nothing.
 * DEBUG_ASSERT is defined, so BUG_ON() keeps whatever definition it
 * already has; without it, BUG_ON() is replaced by an empty macro.
 */
#undef DEBUG_TCP
#define DEBUG_ASSERT

#if defined(DEBUG_TCP)
#define debug_tcp(fmt...) printk(KERN_INFO "tcp: " fmt)
#else
#define debug_tcp(fmt...)
#endif

#if !defined(DEBUG_ASSERT)
/* #undef on a name that is not currently a macro is harmless. */
#undef BUG_ON
#define BUG_ON(expr)
#endif

/* Read-only module parameter "max_lun", default 512. */
static unsigned int iscsi_max_lun = 512;
module_param_named(max_lun, iscsi_max_lun, uint, S_IRUGO);

/* Defined further down; needed early by iscsi_tcp_hdr_recv_prep(). */
static int iscsi_tcp_hdr_recv_done(struct iscsi_tcp_conn *tcp_conn,
				   struct iscsi_chunk *chunk);
72
73 static inline void
74 iscsi_buf_init_iov(struct iscsi_buf *ibuf, char *vbuf, int size)
75 {
76 ibuf->sg.page = virt_to_page(vbuf);
77 ibuf->sg.offset = offset_in_page(vbuf);
78 ibuf->sg.length = size;
79 ibuf->sent = 0;
80 ibuf->use_sendmsg = 1;
81 }
82
83 static inline void
84 iscsi_buf_init_sg(struct iscsi_buf *ibuf, struct scatterlist *sg)
85 {
86 ibuf->sg.page = sg->page;
87 ibuf->sg.offset = sg->offset;
88 ibuf->sg.length = sg->length;
89 /*
90 * Fastpath: sg element fits into single page
91 */
92 if (sg->length + sg->offset <= PAGE_SIZE && !PageSlab(sg->page))
93 ibuf->use_sendmsg = 0;
94 else
95 ibuf->use_sendmsg = 1;
96 ibuf->sent = 0;
97 }
98
99 static inline int
100 iscsi_buf_left(struct iscsi_buf *ibuf)
101 {
102 int rc;
103
104 rc = ibuf->sg.length - ibuf->sent;
105 BUG_ON(rc < 0);
106 return rc;
107 }
108
109 static inline void
110 iscsi_hdr_digest(struct iscsi_conn *conn, struct iscsi_buf *buf,
111 u8* crc)
112 {
113 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
114
115 crypto_hash_digest(&tcp_conn->tx_hash, &buf->sg, buf->sg.length, crc);
116 buf->sg.length += ISCSI_DIGEST_SIZE;
117 }
118
119 /*
120 * Scatterlist handling: inside the iscsi_chunk, we
121 * remember an index into the scatterlist, and set data/size
122 * to the current scatterlist entry. For highmem pages, we
123 * kmap as needed.
124 *
125 * Note that the page is unmapped when we return from
126 * TCP's data_ready handler, so we may end up mapping and
127 * unmapping the same page repeatedly. The whole reason
128 * for this is that we shouldn't keep the page mapped
129 * outside the softirq.
130 */
131
132 /**
133 * iscsi_tcp_chunk_init_sg - init indicated scatterlist entry
134 * @chunk: the buffer object
135 * @idx: index into scatterlist
136 * @offset: byte offset into that sg entry
137 *
138 * This function sets up the chunk so that subsequent
139 * data is copied to the indicated sg entry, at the given
140 * offset.
141 */
142 static inline void
143 iscsi_tcp_chunk_init_sg(struct iscsi_chunk *chunk,
144 unsigned int idx, unsigned int offset)
145 {
146 struct scatterlist *sg;
147
148 BUG_ON(chunk->sg == NULL);
149
150 sg = &chunk->sg[idx];
151 chunk->sg_index = idx;
152 chunk->sg_offset = offset;
153 chunk->size = min(sg->length - offset, chunk->total_size);
154 chunk->data = NULL;
155 }
156
157 /**
158 * iscsi_tcp_chunk_map - map the current S/G page
159 * @chunk: iscsi chunk
160 *
161 * We only need to possibly kmap data if scatter lists are being used,
162 * because the iscsi passthrough and internal IO paths will never use high
163 * mem pages.
164 */
165 static inline void
166 iscsi_tcp_chunk_map(struct iscsi_chunk *chunk)
167 {
168 struct scatterlist *sg;
169
170 if (chunk->data != NULL || !chunk->sg)
171 return;
172
173 sg = &chunk->sg[chunk->sg_index];
174 BUG_ON(chunk->sg_mapped);
175 BUG_ON(sg->length == 0);
176 chunk->sg_mapped = kmap_atomic(sg->page, KM_SOFTIRQ0);
177 chunk->data = chunk->sg_mapped + sg->offset + chunk->sg_offset;
178 }
179
180 static inline void
181 iscsi_tcp_chunk_unmap(struct iscsi_chunk *chunk)
182 {
183 if (chunk->sg_mapped) {
184 kunmap_atomic(chunk->sg_mapped, KM_SOFTIRQ0);
185 chunk->sg_mapped = NULL;
186 chunk->data = NULL;
187 }
188 }
189
190 /*
191 * Splice the digest buffer into the buffer
192 */
193 static inline void
194 iscsi_tcp_chunk_splice_digest(struct iscsi_chunk *chunk, void *digest)
195 {
196 chunk->data = digest;
197 chunk->digest_len = ISCSI_DIGEST_SIZE;
198 chunk->total_size += ISCSI_DIGEST_SIZE;
199 chunk->size = ISCSI_DIGEST_SIZE;
200 chunk->copied = 0;
201 chunk->sg = NULL;
202 chunk->sg_index = 0;
203 chunk->hash = NULL;
204 }
205
206 /**
207 * iscsi_tcp_chunk_done - check whether the chunk is complete
208 * @chunk: iscsi chunk to check
209 *
210 * Check if we're done receiving this chunk. If the receive
211 * buffer is full but we expect more data, move on to the
212 * next entry in the scatterlist.
213 *
214 * If the amount of data we received isn't a multiple of 4,
215 * we will transparently receive the pad bytes, too.
216 *
217 * This function must be re-entrant.
218 */
219 static inline int
220 iscsi_tcp_chunk_done(struct iscsi_chunk *chunk)
221 {
222 static unsigned char padbuf[ISCSI_PAD_LEN];
223 unsigned int pad;
224
225 if (chunk->copied < chunk->size) {
226 iscsi_tcp_chunk_map(chunk);
227 return 0;
228 }
229
230 chunk->total_copied += chunk->copied;
231 chunk->copied = 0;
232 chunk->size = 0;
233
234 /* Unmap the current scatterlist page, if there is one. */
235 iscsi_tcp_chunk_unmap(chunk);
236
237 /* Do we have more scatterlist entries? */
238 if (chunk->total_copied < chunk->total_size) {
239 /* Proceed to the next entry in the scatterlist. */
240 iscsi_tcp_chunk_init_sg(chunk, chunk->sg_index + 1, 0);
241 iscsi_tcp_chunk_map(chunk);
242 BUG_ON(chunk->size == 0);
243 return 0;
244 }
245
246 /* Do we need to handle padding? */
247 pad = iscsi_padding(chunk->total_copied);
248 if (pad != 0) {
249 debug_tcp("consume %d pad bytes\n", pad);
250 chunk->total_size += pad;
251 chunk->size = pad;
252 chunk->data = padbuf;
253 return 0;
254 }
255
256 /*
257 * Set us up for receiving the data digest. hdr digest
258 * is completely handled in hdr done function.
259 */
260 if (chunk->hash) {
261 if (chunk->digest_len == 0) {
262 crypto_hash_final(chunk->hash, chunk->digest);
263 iscsi_tcp_chunk_splice_digest(chunk,
264 chunk->recv_digest);
265 return 0;
266 }
267 }
268
269 return 1;
270 }
271
272 /**
273 * iscsi_tcp_chunk_recv - copy data to chunk
274 * @tcp_conn: the iSCSI TCP connection
275 * @chunk: the buffer to copy to
276 * @ptr: data pointer
277 * @len: amount of data available
278 *
279 * This function copies up to @len bytes to the
280 * given buffer, and returns the number of bytes
281 * consumed, which can actually be less than @len.
282 *
283 * If hash digest is enabled, the function will update the
284 * hash while copying.
285 * Combining these two operations doesn't buy us a lot (yet),
286 * but in the future we could implement combined copy+crc,
287 * just way we do for network layer checksums.
288 */
289 static int
290 iscsi_tcp_chunk_recv(struct iscsi_tcp_conn *tcp_conn,
291 struct iscsi_chunk *chunk, const void *ptr,
292 unsigned int len)
293 {
294 struct scatterlist sg;
295 unsigned int copy, copied = 0;
296
297 while (!iscsi_tcp_chunk_done(chunk)) {
298 if (copied == len)
299 goto out;
300
301 copy = min(len - copied, chunk->size - chunk->copied);
302 memcpy(chunk->data + chunk->copied, ptr + copied, copy);
303
304 if (chunk->hash) {
305 sg_init_one(&sg, ptr + copied, copy);
306 crypto_hash_update(chunk->hash, &sg, copy);
307 }
308 chunk->copied += copy;
309 copied += copy;
310 }
311
312 out:
313 return copied;
314 }
315
316 static inline void
317 iscsi_tcp_dgst_header(struct hash_desc *hash, const void *hdr, size_t hdrlen,
318 unsigned char digest[ISCSI_DIGEST_SIZE])
319 {
320 struct scatterlist sg;
321
322 sg_init_one(&sg, hdr, hdrlen);
323 crypto_hash_digest(hash, &sg, hdrlen, digest);
324 }
325
326 static inline int
327 iscsi_tcp_dgst_verify(struct iscsi_tcp_conn *tcp_conn,
328 struct iscsi_chunk *chunk)
329 {
330 if (!chunk->digest_len)
331 return 1;
332
333 if (memcmp(chunk->recv_digest, chunk->digest, chunk->digest_len)) {
334 debug_scsi("digest mismatch\n");
335 return 0;
336 }
337
338 return 1;
339 }
340
341 /*
342 * Helper function to set up chunk buffer
343 */
344 static inline void
345 __iscsi_chunk_init(struct iscsi_chunk *chunk, size_t size,
346 iscsi_chunk_done_fn_t *done, struct hash_desc *hash)
347 {
348 memset(chunk, 0, sizeof(*chunk));
349 chunk->total_size = size;
350 chunk->done = done;
351
352 if (hash) {
353 chunk->hash = hash;
354 crypto_hash_init(hash);
355 }
356 }
357
358 static inline void
359 iscsi_chunk_init_linear(struct iscsi_chunk *chunk, void *data, size_t size,
360 iscsi_chunk_done_fn_t *done, struct hash_desc *hash)
361 {
362 __iscsi_chunk_init(chunk, size, done, hash);
363 chunk->data = data;
364 chunk->size = size;
365 }
366
367 static inline int
368 iscsi_chunk_seek_sg(struct iscsi_chunk *chunk,
369 struct scatterlist *sg, unsigned int sg_count,
370 unsigned int offset, size_t size,
371 iscsi_chunk_done_fn_t *done, struct hash_desc *hash)
372 {
373 unsigned int i;
374
375 __iscsi_chunk_init(chunk, size, done, hash);
376 for (i = 0; i < sg_count; ++i) {
377 if (offset < sg[i].length) {
378 chunk->sg = sg;
379 chunk->sg_count = sg_count;
380 iscsi_tcp_chunk_init_sg(chunk, i, offset);
381 return 0;
382 }
383 offset -= sg[i].length;
384 }
385
386 return ISCSI_ERR_DATA_OFFSET;
387 }
388
389 /**
390 * iscsi_tcp_hdr_recv_prep - prep chunk for hdr reception
391 * @tcp_conn: iscsi connection to prep for
392 *
393 * This function always passes NULL for the hash argument, because when this
394 * function is called we do not yet know the final size of the header and want
395 * to delay the digest processing until we know that.
396 */
397 static void
398 iscsi_tcp_hdr_recv_prep(struct iscsi_tcp_conn *tcp_conn)
399 {
400 debug_tcp("iscsi_tcp_hdr_recv_prep(%p%s)\n", tcp_conn,
401 tcp_conn->iscsi_conn->hdrdgst_en ? ", digest enabled" : "");
402 iscsi_chunk_init_linear(&tcp_conn->in.chunk,
403 tcp_conn->in.hdr_buf, sizeof(struct iscsi_hdr),
404 iscsi_tcp_hdr_recv_done, NULL);
405 }
406
407 /*
408 * Handle incoming reply to any other type of command
409 */
410 static int
411 iscsi_tcp_data_recv_done(struct iscsi_tcp_conn *tcp_conn,
412 struct iscsi_chunk *chunk)
413 {
414 struct iscsi_conn *conn = tcp_conn->iscsi_conn;
415 int rc = 0;
416
417 if (!iscsi_tcp_dgst_verify(tcp_conn, chunk))
418 return ISCSI_ERR_DATA_DGST;
419
420 rc = iscsi_complete_pdu(conn, tcp_conn->in.hdr,
421 conn->data, tcp_conn->in.datalen);
422 if (rc)
423 return rc;
424
425 iscsi_tcp_hdr_recv_prep(tcp_conn);
426 return 0;
427 }
428
429 static void
430 iscsi_tcp_data_recv_prep(struct iscsi_tcp_conn *tcp_conn)
431 {
432 struct iscsi_conn *conn = tcp_conn->iscsi_conn;
433 struct hash_desc *rx_hash = NULL;
434
435 if (conn->datadgst_en)
436 rx_hash = &tcp_conn->rx_hash;
437
438 iscsi_chunk_init_linear(&tcp_conn->in.chunk,
439 conn->data, tcp_conn->in.datalen,
440 iscsi_tcp_data_recv_done, rx_hash);
441 }
442
443 /*
444 * must be called with session lock
445 */
446 static void
447 iscsi_tcp_cleanup_ctask(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask)
448 {
449 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
450 struct iscsi_r2t_info *r2t;
451 struct scsi_cmnd *sc;
452
453 /* flush ctask's r2t queues */
454 while (__kfifo_get(tcp_ctask->r2tqueue, (void*)&r2t, sizeof(void*))) {
455 __kfifo_put(tcp_ctask->r2tpool.queue, (void*)&r2t,
456 sizeof(void*));
457 debug_scsi("iscsi_tcp_cleanup_ctask pending r2t dropped\n");
458 }
459
460 sc = ctask->sc;
461 if (unlikely(!sc))
462 return;
463
464 tcp_ctask->xmstate = XMSTATE_IDLE;
465 tcp_ctask->r2t = NULL;
466 }
467
468 /**
469 * iscsi_data_rsp - SCSI Data-In Response processing
470 * @conn: iscsi connection
471 * @ctask: scsi command task
472 **/
473 static int
474 iscsi_data_rsp(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask)
475 {
476 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
477 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
478 struct iscsi_data_rsp *rhdr = (struct iscsi_data_rsp *)tcp_conn->in.hdr;
479 struct iscsi_session *session = conn->session;
480 struct scsi_cmnd *sc = ctask->sc;
481 int datasn = be32_to_cpu(rhdr->datasn);
482
483 iscsi_update_cmdsn(session, (struct iscsi_nopin*)rhdr);
484 /*
485 * setup Data-In byte counter (gets decremented..)
486 */
487 ctask->data_count = tcp_conn->in.datalen;
488
489 if (tcp_conn->in.datalen == 0)
490 return 0;
491
492 if (tcp_ctask->exp_datasn != datasn) {
493 debug_tcp("%s: ctask->exp_datasn(%d) != rhdr->datasn(%d)\n",
494 __FUNCTION__, tcp_ctask->exp_datasn, datasn);
495 return ISCSI_ERR_DATASN;
496 }
497
498 tcp_ctask->exp_datasn++;
499
500 tcp_ctask->data_offset = be32_to_cpu(rhdr->offset);
501 if (tcp_ctask->data_offset + tcp_conn->in.datalen > scsi_bufflen(sc)) {
502 debug_tcp("%s: data_offset(%d) + data_len(%d) > total_length_in(%d)\n",
503 __FUNCTION__, tcp_ctask->data_offset,
504 tcp_conn->in.datalen, scsi_bufflen(sc));
505 return ISCSI_ERR_DATA_OFFSET;
506 }
507
508 if (rhdr->flags & ISCSI_FLAG_DATA_STATUS) {
509 sc->result = (DID_OK << 16) | rhdr->cmd_status;
510 conn->exp_statsn = be32_to_cpu(rhdr->statsn) + 1;
511 if (rhdr->flags & (ISCSI_FLAG_DATA_UNDERFLOW |
512 ISCSI_FLAG_DATA_OVERFLOW)) {
513 int res_count = be32_to_cpu(rhdr->residual_count);
514
515 if (res_count > 0 &&
516 (rhdr->flags & ISCSI_FLAG_CMD_OVERFLOW ||
517 res_count <= scsi_bufflen(sc)))
518 scsi_set_resid(sc, res_count);
519 else
520 sc->result = (DID_BAD_TARGET << 16) |
521 rhdr->cmd_status;
522 }
523 }
524
525 conn->datain_pdus_cnt++;
526 return 0;
527 }
528
529 /**
530 * iscsi_solicit_data_init - initialize first Data-Out
531 * @conn: iscsi connection
532 * @ctask: scsi command task
533 * @r2t: R2T info
534 *
535 * Notes:
536 * Initialize first Data-Out within this R2T sequence and finds
537 * proper data_offset within this SCSI command.
538 *
539 * This function is called with connection lock taken.
540 **/
541 static void
542 iscsi_solicit_data_init(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask,
543 struct iscsi_r2t_info *r2t)
544 {
545 struct iscsi_data *hdr;
546 struct scsi_cmnd *sc = ctask->sc;
547 int i, sg_count = 0;
548 struct scatterlist *sg;
549
550 hdr = &r2t->dtask.hdr;
551 memset(hdr, 0, sizeof(struct iscsi_data));
552 hdr->ttt = r2t->ttt;
553 hdr->datasn = cpu_to_be32(r2t->solicit_datasn);
554 r2t->solicit_datasn++;
555 hdr->opcode = ISCSI_OP_SCSI_DATA_OUT;
556 memcpy(hdr->lun, ctask->hdr->lun, sizeof(hdr->lun));
557 hdr->itt = ctask->hdr->itt;
558 hdr->exp_statsn = r2t->exp_statsn;
559 hdr->offset = cpu_to_be32(r2t->data_offset);
560 if (r2t->data_length > conn->max_xmit_dlength) {
561 hton24(hdr->dlength, conn->max_xmit_dlength);
562 r2t->data_count = conn->max_xmit_dlength;
563 hdr->flags = 0;
564 } else {
565 hton24(hdr->dlength, r2t->data_length);
566 r2t->data_count = r2t->data_length;
567 hdr->flags = ISCSI_FLAG_CMD_FINAL;
568 }
569 conn->dataout_pdus_cnt++;
570
571 r2t->sent = 0;
572
573 iscsi_buf_init_iov(&r2t->headbuf, (char*)hdr,
574 sizeof(struct iscsi_hdr));
575
576 sg = scsi_sglist(sc);
577 r2t->sg = NULL;
578 for (i = 0; i < scsi_sg_count(sc); i++, sg += 1) {
579 /* FIXME: prefetch ? */
580 if (sg_count + sg->length > r2t->data_offset) {
581 int page_offset;
582
583 /* sg page found! */
584
585 /* offset within this page */
586 page_offset = r2t->data_offset - sg_count;
587
588 /* fill in this buffer */
589 iscsi_buf_init_sg(&r2t->sendbuf, sg);
590 r2t->sendbuf.sg.offset += page_offset;
591 r2t->sendbuf.sg.length -= page_offset;
592
593 /* xmit logic will continue with next one */
594 r2t->sg = sg + 1;
595 break;
596 }
597 sg_count += sg->length;
598 }
599 BUG_ON(r2t->sg == NULL);
600 }
601
602 /**
603 * iscsi_r2t_rsp - iSCSI R2T Response processing
604 * @conn: iscsi connection
605 * @ctask: scsi command task
606 **/
607 static int
608 iscsi_r2t_rsp(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask)
609 {
610 struct iscsi_r2t_info *r2t;
611 struct iscsi_session *session = conn->session;
612 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
613 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
614 struct iscsi_r2t_rsp *rhdr = (struct iscsi_r2t_rsp *)tcp_conn->in.hdr;
615 int r2tsn = be32_to_cpu(rhdr->r2tsn);
616 int rc;
617
618 if (tcp_conn->in.datalen) {
619 printk(KERN_ERR "iscsi_tcp: invalid R2t with datalen %d\n",
620 tcp_conn->in.datalen);
621 return ISCSI_ERR_DATALEN;
622 }
623
624 if (tcp_ctask->exp_datasn != r2tsn){
625 debug_tcp("%s: ctask->exp_datasn(%d) != rhdr->r2tsn(%d)\n",
626 __FUNCTION__, tcp_ctask->exp_datasn, r2tsn);
627 return ISCSI_ERR_R2TSN;
628 }
629
630 /* fill-in new R2T associated with the task */
631 spin_lock(&session->lock);
632 iscsi_update_cmdsn(session, (struct iscsi_nopin*)rhdr);
633
634 if (!ctask->sc || session->state != ISCSI_STATE_LOGGED_IN) {
635 printk(KERN_INFO "iscsi_tcp: dropping R2T itt %d in "
636 "recovery...\n", ctask->itt);
637 spin_unlock(&session->lock);
638 return 0;
639 }
640
641 rc = __kfifo_get(tcp_ctask->r2tpool.queue, (void*)&r2t, sizeof(void*));
642 BUG_ON(!rc);
643
644 r2t->exp_statsn = rhdr->statsn;
645 r2t->data_length = be32_to_cpu(rhdr->data_length);
646 if (r2t->data_length == 0) {
647 printk(KERN_ERR "iscsi_tcp: invalid R2T with zero data len\n");
648 spin_unlock(&session->lock);
649 return ISCSI_ERR_DATALEN;
650 }
651
652 if (r2t->data_length > session->max_burst)
653 debug_scsi("invalid R2T with data len %u and max burst %u."
654 "Attempting to execute request.\n",
655 r2t->data_length, session->max_burst);
656
657 r2t->data_offset = be32_to_cpu(rhdr->data_offset);
658 if (r2t->data_offset + r2t->data_length > scsi_bufflen(ctask->sc)) {
659 spin_unlock(&session->lock);
660 printk(KERN_ERR "iscsi_tcp: invalid R2T with data len %u at "
661 "offset %u and total length %d\n", r2t->data_length,
662 r2t->data_offset, scsi_bufflen(ctask->sc));
663 return ISCSI_ERR_DATALEN;
664 }
665
666 r2t->ttt = rhdr->ttt; /* no flip */
667 r2t->solicit_datasn = 0;
668
669 iscsi_solicit_data_init(conn, ctask, r2t);
670
671 tcp_ctask->exp_datasn = r2tsn + 1;
672 __kfifo_put(tcp_ctask->r2tqueue, (void*)&r2t, sizeof(void*));
673 tcp_ctask->xmstate |= XMSTATE_SOL_HDR_INIT;
674 conn->r2t_pdus_cnt++;
675
676 iscsi_requeue_ctask(ctask);
677 spin_unlock(&session->lock);
678
679 return 0;
680 }
681
682 /*
683 * Handle incoming reply to DataIn command
684 */
685 static int
686 iscsi_tcp_process_data_in(struct iscsi_tcp_conn *tcp_conn,
687 struct iscsi_chunk *chunk)
688 {
689 struct iscsi_conn *conn = tcp_conn->iscsi_conn;
690 struct iscsi_hdr *hdr = tcp_conn->in.hdr;
691 int rc;
692
693 if (!iscsi_tcp_dgst_verify(tcp_conn, chunk))
694 return ISCSI_ERR_DATA_DGST;
695
696 /* check for non-exceptional status */
697 if (hdr->flags & ISCSI_FLAG_DATA_STATUS) {
698 rc = iscsi_complete_pdu(conn, tcp_conn->in.hdr, NULL, 0);
699 if (rc)
700 return rc;
701 }
702
703 iscsi_tcp_hdr_recv_prep(tcp_conn);
704 return 0;
705 }
706
707 /**
708 * iscsi_tcp_hdr_dissect - process PDU header
709 * @conn: iSCSI connection
710 * @hdr: PDU header
711 *
712 * This function analyzes the header of the PDU received,
713 * and performs several sanity checks. If the PDU is accompanied
714 * by data, the receive buffer is set up to copy the incoming data
715 * to the correct location.
716 */
717 static int
718 iscsi_tcp_hdr_dissect(struct iscsi_conn *conn, struct iscsi_hdr *hdr)
719 {
720 int rc = 0, opcode, ahslen;
721 struct iscsi_session *session = conn->session;
722 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
723 struct iscsi_cmd_task *ctask;
724 uint32_t itt;
725
726 /* verify PDU length */
727 tcp_conn->in.datalen = ntoh24(hdr->dlength);
728 if (tcp_conn->in.datalen > conn->max_recv_dlength) {
729 printk(KERN_ERR "iscsi_tcp: datalen %d > %d\n",
730 tcp_conn->in.datalen, conn->max_recv_dlength);
731 return ISCSI_ERR_DATALEN;
732 }
733
734 /* Additional header segments. So far, we don't
735 * process additional headers.
736 */
737 ahslen = hdr->hlength << 2;
738
739 opcode = hdr->opcode & ISCSI_OPCODE_MASK;
740 /* verify itt (itt encoding: age+cid+itt) */
741 rc = iscsi_verify_itt(conn, hdr, &itt);
742 if (rc == ISCSI_ERR_NO_SCSI_CMD) {
743 /* XXX: what does this do? */
744 tcp_conn->in.datalen = 0; /* force drop */
745 return 0;
746 } else if (rc)
747 return rc;
748
749 debug_tcp("opcode 0x%x ahslen %d datalen %d\n",
750 opcode, ahslen, tcp_conn->in.datalen);
751
752 switch(opcode) {
753 case ISCSI_OP_SCSI_DATA_IN:
754 ctask = session->cmds[itt];
755 rc = iscsi_data_rsp(conn, ctask);
756 if (rc)
757 return rc;
758 if (tcp_conn->in.datalen) {
759 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
760 struct hash_desc *rx_hash = NULL;
761
762 /*
763 * Setup copy of Data-In into the Scsi_Cmnd
764 * Scatterlist case:
765 * We set up the iscsi_chunk to point to the next
766 * scatterlist entry to copy to. As we go along,
767 * we move on to the next scatterlist entry and
768 * update the digest per-entry.
769 */
770 if (conn->datadgst_en)
771 rx_hash = &tcp_conn->rx_hash;
772
773 debug_tcp("iscsi_tcp_begin_data_in(%p, offset=%d, "
774 "datalen=%d)\n", tcp_conn,
775 tcp_ctask->data_offset,
776 tcp_conn->in.datalen);
777 return iscsi_chunk_seek_sg(&tcp_conn->in.chunk,
778 scsi_sglist(ctask->sc),
779 scsi_sg_count(ctask->sc),
780 tcp_ctask->data_offset,
781 tcp_conn->in.datalen,
782 iscsi_tcp_process_data_in,
783 rx_hash);
784 }
785 /* fall through */
786 case ISCSI_OP_SCSI_CMD_RSP:
787 if (tcp_conn->in.datalen) {
788 iscsi_tcp_data_recv_prep(tcp_conn);
789 return 0;
790 }
791 rc = iscsi_complete_pdu(conn, hdr, NULL, 0);
792 break;
793 case ISCSI_OP_R2T:
794 ctask = session->cmds[itt];
795 if (ahslen)
796 rc = ISCSI_ERR_AHSLEN;
797 else if (ctask->sc->sc_data_direction == DMA_TO_DEVICE)
798 rc = iscsi_r2t_rsp(conn, ctask);
799 else
800 rc = ISCSI_ERR_PROTO;
801 break;
802 case ISCSI_OP_LOGIN_RSP:
803 case ISCSI_OP_TEXT_RSP:
804 case ISCSI_OP_REJECT:
805 case ISCSI_OP_ASYNC_EVENT:
806 /*
807 * It is possible that we could get a PDU with a buffer larger
808 * than 8K, but there are no targets that currently do this.
809 * For now we fail until we find a vendor that needs it
810 */
811 if (ISCSI_DEF_MAX_RECV_SEG_LEN < tcp_conn->in.datalen) {
812 printk(KERN_ERR "iscsi_tcp: received buffer of len %u "
813 "but conn buffer is only %u (opcode %0x)\n",
814 tcp_conn->in.datalen,
815 ISCSI_DEF_MAX_RECV_SEG_LEN, opcode);
816 rc = ISCSI_ERR_PROTO;
817 break;
818 }
819
820 /* If there's data coming in with the response,
821 * receive it to the connection's buffer.
822 */
823 if (tcp_conn->in.datalen) {
824 iscsi_tcp_data_recv_prep(tcp_conn);
825 return 0;
826 }
827 /* fall through */
828 case ISCSI_OP_LOGOUT_RSP:
829 case ISCSI_OP_NOOP_IN:
830 case ISCSI_OP_SCSI_TMFUNC_RSP:
831 rc = iscsi_complete_pdu(conn, hdr, NULL, 0);
832 break;
833 default:
834 rc = ISCSI_ERR_BAD_OPCODE;
835 break;
836 }
837
838 if (rc == 0) {
839 /* Anything that comes with data should have
840 * been handled above. */
841 if (tcp_conn->in.datalen)
842 return ISCSI_ERR_PROTO;
843 iscsi_tcp_hdr_recv_prep(tcp_conn);
844 }
845
846 return rc;
847 }
848
849 static inline void
850 partial_sg_digest_update(struct hash_desc *desc, struct scatterlist *sg,
851 int offset, int length)
852 {
853 struct scatterlist temp;
854
855 sg_init_table(&temp, 1);
856 sg_set_page(&temp, sg_page(sg), length, offset);
857 crypto_hash_update(desc, &temp, length);
858 }
859
860 /**
861 * iscsi_tcp_hdr_recv_done - process PDU header
862 *
863 * This is the callback invoked when the PDU header has
864 * been received. If the header is followed by additional
865 * header segments, we go back for more data.
866 */
867 static int
868 iscsi_tcp_hdr_recv_done(struct iscsi_tcp_conn *tcp_conn,
869 struct iscsi_chunk *chunk)
870 {
871 struct iscsi_conn *conn = tcp_conn->iscsi_conn;
872 struct iscsi_hdr *hdr;
873
874 /* Check if there are additional header segments
875 * *prior* to computing the digest, because we
876 * may need to go back to the caller for more.
877 */
878 hdr = (struct iscsi_hdr *) tcp_conn->in.hdr_buf;
879 if (chunk->copied == sizeof(struct iscsi_hdr) && hdr->hlength) {
880 /* Bump the header length - the caller will
881 * just loop around and get the AHS for us, and
882 * call again. */
883 unsigned int ahslen = hdr->hlength << 2;
884
885 /* Make sure we don't overflow */
886 if (sizeof(*hdr) + ahslen > sizeof(tcp_conn->in.hdr_buf))
887 return ISCSI_ERR_AHSLEN;
888
889 chunk->total_size += ahslen;
890 chunk->size += ahslen;
891 return 0;
892 }
893
894 /* We're done processing the header. See if we're doing
895 * header digests; if so, set up the recv_digest buffer
896 * and go back for more. */
897 if (conn->hdrdgst_en) {
898 if (chunk->digest_len == 0) {
899 iscsi_tcp_chunk_splice_digest(chunk,
900 chunk->recv_digest);
901 return 0;
902 }
903 iscsi_tcp_dgst_header(&tcp_conn->rx_hash, hdr,
904 chunk->total_copied - ISCSI_DIGEST_SIZE,
905 chunk->digest);
906
907 if (!iscsi_tcp_dgst_verify(tcp_conn, chunk))
908 return ISCSI_ERR_HDR_DGST;
909 }
910
911 tcp_conn->in.hdr = hdr;
912 return iscsi_tcp_hdr_dissect(conn, hdr);
913 }
914
915 /**
916 * iscsi_tcp_recv - TCP receive in sendfile fashion
917 * @rd_desc: read descriptor
918 * @skb: socket buffer
919 * @offset: offset in skb
920 * @len: skb->len - offset
921 **/
922 static int
923 iscsi_tcp_recv(read_descriptor_t *rd_desc, struct sk_buff *skb,
924 unsigned int offset, size_t len)
925 {
926 struct iscsi_conn *conn = rd_desc->arg.data;
927 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
928 struct iscsi_chunk *chunk = &tcp_conn->in.chunk;
929 struct skb_seq_state seq;
930 unsigned int consumed = 0;
931 int rc = 0;
932
933 debug_tcp("in %d bytes\n", skb->len - offset);
934
935 if (unlikely(conn->suspend_rx)) {
936 debug_tcp("conn %d Rx suspended!\n", conn->id);
937 return 0;
938 }
939
940 skb_prepare_seq_read(skb, offset, skb->len, &seq);
941 while (1) {
942 unsigned int avail;
943 const u8 *ptr;
944
945 avail = skb_seq_read(consumed, &ptr, &seq);
946 if (avail == 0)
947 break;
948 BUG_ON(chunk->copied >= chunk->size);
949
950 debug_tcp("skb %p ptr=%p avail=%u\n", skb, ptr, avail);
951 rc = iscsi_tcp_chunk_recv(tcp_conn, chunk, ptr, avail);
952 BUG_ON(rc == 0);
953 consumed += rc;
954
955 if (chunk->total_copied >= chunk->total_size) {
956 rc = chunk->done(tcp_conn, chunk);
957 if (rc != 0) {
958 skb_abort_seq_read(&seq);
959 goto error;
960 }
961
962 /* The done() functions sets up the
963 * next chunk. */
964 }
965 }
966
967 conn->rxdata_octets += consumed;
968 return consumed;
969
970 error:
971 debug_tcp("Error receiving PDU, errno=%d\n", rc);
972 iscsi_conn_failure(conn, ISCSI_ERR_CONN_FAILED);
973 return 0;
974 }
975
976 static void
977 iscsi_tcp_data_ready(struct sock *sk, int flag)
978 {
979 struct iscsi_conn *conn = sk->sk_user_data;
980 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
981 read_descriptor_t rd_desc;
982
983 read_lock(&sk->sk_callback_lock);
984
985 /*
986 * Use rd_desc to pass 'conn' to iscsi_tcp_recv.
987 * We set count to 1 because we want the network layer to
988 * hand us all the skbs that are available. iscsi_tcp_recv
989 * handled pdus that cross buffers or pdus that still need data.
990 */
991 rd_desc.arg.data = conn;
992 rd_desc.count = 1;
993 tcp_read_sock(sk, &rd_desc, iscsi_tcp_recv);
994
995 read_unlock(&sk->sk_callback_lock);
996
997 /* If we had to (atomically) map a highmem page,
998 * unmap it now. */
999 iscsi_tcp_chunk_unmap(&tcp_conn->in.chunk);
1000 }
1001
1002 static void
1003 iscsi_tcp_state_change(struct sock *sk)
1004 {
1005 struct iscsi_tcp_conn *tcp_conn;
1006 struct iscsi_conn *conn;
1007 struct iscsi_session *session;
1008 void (*old_state_change)(struct sock *);
1009
1010 read_lock(&sk->sk_callback_lock);
1011
1012 conn = (struct iscsi_conn*)sk->sk_user_data;
1013 session = conn->session;
1014
1015 if ((sk->sk_state == TCP_CLOSE_WAIT ||
1016 sk->sk_state == TCP_CLOSE) &&
1017 !atomic_read(&sk->sk_rmem_alloc)) {
1018 debug_tcp("iscsi_tcp_state_change: TCP_CLOSE|TCP_CLOSE_WAIT\n");
1019 iscsi_conn_failure(conn, ISCSI_ERR_CONN_FAILED);
1020 }
1021
1022 tcp_conn = conn->dd_data;
1023 old_state_change = tcp_conn->old_state_change;
1024
1025 read_unlock(&sk->sk_callback_lock);
1026
1027 old_state_change(sk);
1028 }
1029
1030 /**
1031 * iscsi_write_space - Called when more output buffer space is available
1032 * @sk: socket space is available for
1033 **/
1034 static void
1035 iscsi_write_space(struct sock *sk)
1036 {
1037 struct iscsi_conn *conn = (struct iscsi_conn*)sk->sk_user_data;
1038 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1039
1040 tcp_conn->old_write_space(sk);
1041 debug_tcp("iscsi_write_space: cid %d\n", conn->id);
1042 scsi_queue_work(conn->session->host, &conn->xmitwork);
1043 }
1044
1045 static void
1046 iscsi_conn_set_callbacks(struct iscsi_conn *conn)
1047 {
1048 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1049 struct sock *sk = tcp_conn->sock->sk;
1050
1051 /* assign new callbacks */
1052 write_lock_bh(&sk->sk_callback_lock);
1053 sk->sk_user_data = conn;
1054 tcp_conn->old_data_ready = sk->sk_data_ready;
1055 tcp_conn->old_state_change = sk->sk_state_change;
1056 tcp_conn->old_write_space = sk->sk_write_space;
1057 sk->sk_data_ready = iscsi_tcp_data_ready;
1058 sk->sk_state_change = iscsi_tcp_state_change;
1059 sk->sk_write_space = iscsi_write_space;
1060 write_unlock_bh(&sk->sk_callback_lock);
1061 }
1062
1063 static void
1064 iscsi_conn_restore_callbacks(struct iscsi_tcp_conn *tcp_conn)
1065 {
1066 struct sock *sk = tcp_conn->sock->sk;
1067
1068 /* restore socket callbacks, see also: iscsi_conn_set_callbacks() */
1069 write_lock_bh(&sk->sk_callback_lock);
1070 sk->sk_user_data = NULL;
1071 sk->sk_data_ready = tcp_conn->old_data_ready;
1072 sk->sk_state_change = tcp_conn->old_state_change;
1073 sk->sk_write_space = tcp_conn->old_write_space;
1074 sk->sk_no_check = 0;
1075 write_unlock_bh(&sk->sk_callback_lock);
1076 }
1077
1078 /**
1079 * iscsi_send - generic send routine
1080 * @sk: kernel's socket
1081 * @buf: buffer to write from
1082 * @size: actual size to write
1083 * @flags: socket's flags
1084 */
1085 static inline int
1086 iscsi_send(struct iscsi_conn *conn, struct iscsi_buf *buf, int size, int flags)
1087 {
1088 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1089 struct socket *sk = tcp_conn->sock;
1090 int offset = buf->sg.offset + buf->sent, res;
1091
1092 /*
1093 * if we got use_sg=0 or are sending something we kmallocd
1094 * then we did not have to do kmap (kmap returns page_address)
1095 *
1096 * if we got use_sg > 0, but had to drop down, we do not
1097 * set clustering so this should only happen for that
1098 * slab case.
1099 */
1100 if (buf->use_sendmsg)
1101 res = sock_no_sendpage(sk, buf->sg.page, offset, size, flags);
1102 else
1103 res = tcp_conn->sendpage(sk, buf->sg.page, offset, size, flags);
1104
1105 if (res >= 0) {
1106 conn->txdata_octets += res;
1107 buf->sent += res;
1108 return res;
1109 }
1110
1111 tcp_conn->sendpage_failures_cnt++;
1112 if (res == -EAGAIN)
1113 res = -ENOBUFS;
1114 else
1115 iscsi_conn_failure(conn, ISCSI_ERR_CONN_FAILED);
1116 return res;
1117 }
1118
1119 /**
1120 * iscsi_sendhdr - send PDU Header via tcp_sendpage()
1121 * @conn: iscsi connection
1122 * @buf: buffer to write from
1123 * @datalen: lenght of data to be sent after the header
1124 *
1125 * Notes:
1126 * (Tx, Fast Path)
1127 **/
1128 static inline int
1129 iscsi_sendhdr(struct iscsi_conn *conn, struct iscsi_buf *buf, int datalen)
1130 {
1131 int flags = 0; /* MSG_DONTWAIT; */
1132 int res, size;
1133
1134 size = buf->sg.length - buf->sent;
1135 BUG_ON(buf->sent + size > buf->sg.length);
1136 if (buf->sent + size != buf->sg.length || datalen)
1137 flags |= MSG_MORE;
1138
1139 res = iscsi_send(conn, buf, size, flags);
1140 debug_tcp("sendhdr %d bytes, sent %d res %d\n", size, buf->sent, res);
1141 if (res >= 0) {
1142 if (size != res)
1143 return -EAGAIN;
1144 return 0;
1145 }
1146
1147 return res;
1148 }
1149
1150 /**
1151 * iscsi_sendpage - send one page of iSCSI Data-Out.
1152 * @conn: iscsi connection
1153 * @buf: buffer to write from
1154 * @count: remaining data
1155 * @sent: number of bytes sent
1156 *
1157 * Notes:
1158 * (Tx, Fast Path)
1159 **/
1160 static inline int
1161 iscsi_sendpage(struct iscsi_conn *conn, struct iscsi_buf *buf,
1162 int *count, int *sent)
1163 {
1164 int flags = 0; /* MSG_DONTWAIT; */
1165 int res, size;
1166
1167 size = buf->sg.length - buf->sent;
1168 BUG_ON(buf->sent + size > buf->sg.length);
1169 if (size > *count)
1170 size = *count;
1171 if (buf->sent + size != buf->sg.length || *count != size)
1172 flags |= MSG_MORE;
1173
1174 res = iscsi_send(conn, buf, size, flags);
1175 debug_tcp("sendpage: %d bytes, sent %d left %d sent %d res %d\n",
1176 size, buf->sent, *count, *sent, res);
1177 if (res >= 0) {
1178 *count -= res;
1179 *sent += res;
1180 if (size != res)
1181 return -EAGAIN;
1182 return 0;
1183 }
1184
1185 return res;
1186 }
1187
1188 static inline void
1189 iscsi_data_digest_init(struct iscsi_tcp_conn *tcp_conn,
1190 struct iscsi_tcp_cmd_task *tcp_ctask)
1191 {
1192 crypto_hash_init(&tcp_conn->tx_hash);
1193 tcp_ctask->digest_count = 4;
1194 }
1195
1196 /**
1197 * iscsi_solicit_data_cont - initialize next Data-Out
1198 * @conn: iscsi connection
1199 * @ctask: scsi command task
1200 * @r2t: R2T info
1201 * @left: bytes left to transfer
1202 *
1203 * Notes:
1204 * Initialize next Data-Out within this R2T sequence and continue
1205 * to process next Scatter-Gather element(if any) of this SCSI command.
1206 *
1207 * Called under connection lock.
1208 **/
1209 static void
1210 iscsi_solicit_data_cont(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask,
1211 struct iscsi_r2t_info *r2t, int left)
1212 {
1213 struct iscsi_data *hdr;
1214 int new_offset;
1215
1216 hdr = &r2t->dtask.hdr;
1217 memset(hdr, 0, sizeof(struct iscsi_data));
1218 hdr->ttt = r2t->ttt;
1219 hdr->datasn = cpu_to_be32(r2t->solicit_datasn);
1220 r2t->solicit_datasn++;
1221 hdr->opcode = ISCSI_OP_SCSI_DATA_OUT;
1222 memcpy(hdr->lun, ctask->hdr->lun, sizeof(hdr->lun));
1223 hdr->itt = ctask->hdr->itt;
1224 hdr->exp_statsn = r2t->exp_statsn;
1225 new_offset = r2t->data_offset + r2t->sent;
1226 hdr->offset = cpu_to_be32(new_offset);
1227 if (left > conn->max_xmit_dlength) {
1228 hton24(hdr->dlength, conn->max_xmit_dlength);
1229 r2t->data_count = conn->max_xmit_dlength;
1230 } else {
1231 hton24(hdr->dlength, left);
1232 r2t->data_count = left;
1233 hdr->flags = ISCSI_FLAG_CMD_FINAL;
1234 }
1235 conn->dataout_pdus_cnt++;
1236
1237 iscsi_buf_init_iov(&r2t->headbuf, (char*)hdr,
1238 sizeof(struct iscsi_hdr));
1239
1240 if (iscsi_buf_left(&r2t->sendbuf))
1241 return;
1242
1243 iscsi_buf_init_sg(&r2t->sendbuf, r2t->sg);
1244 r2t->sg += 1;
1245 }
1246
1247 static void iscsi_set_padding(struct iscsi_tcp_cmd_task *tcp_ctask,
1248 unsigned long len)
1249 {
1250 tcp_ctask->pad_count = len & (ISCSI_PAD_LEN - 1);
1251 if (!tcp_ctask->pad_count)
1252 return;
1253
1254 tcp_ctask->pad_count = ISCSI_PAD_LEN - tcp_ctask->pad_count;
1255 debug_scsi("write padding %d bytes\n", tcp_ctask->pad_count);
1256 tcp_ctask->xmstate |= XMSTATE_W_PAD;
1257 }
1258
1259 /**
1260 * iscsi_tcp_cmd_init - Initialize iSCSI SCSI_READ or SCSI_WRITE commands
1261 * @conn: iscsi connection
1262 * @ctask: scsi command task
1263 * @sc: scsi command
1264 **/
1265 static void
1266 iscsi_tcp_cmd_init(struct iscsi_cmd_task *ctask)
1267 {
1268 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1269
1270 BUG_ON(__kfifo_len(tcp_ctask->r2tqueue));
1271 tcp_ctask->xmstate = XMSTATE_CMD_HDR_INIT;
1272 }
1273
1274 /**
1275 * iscsi_tcp_mtask_xmit - xmit management(immediate) task
1276 * @conn: iscsi connection
1277 * @mtask: task management task
1278 *
1279 * Notes:
1280 * The function can return -EAGAIN in which case caller must
1281 * call it again later, or recover. '0' return code means successful
1282 * xmit.
1283 *
1284 * Management xmit state machine consists of these states:
1285 * XMSTATE_IMM_HDR_INIT - calculate digest of PDU Header
1286 * XMSTATE_IMM_HDR - PDU Header xmit in progress
1287 * XMSTATE_IMM_DATA - PDU Data xmit in progress
1288 * XMSTATE_IDLE - management PDU is done
1289 **/
1290 static int
1291 iscsi_tcp_mtask_xmit(struct iscsi_conn *conn, struct iscsi_mgmt_task *mtask)
1292 {
1293 struct iscsi_tcp_mgmt_task *tcp_mtask = mtask->dd_data;
1294 int rc;
1295
1296 debug_scsi("mtask deq [cid %d state %x itt 0x%x]\n",
1297 conn->id, tcp_mtask->xmstate, mtask->itt);
1298
1299 if (tcp_mtask->xmstate & XMSTATE_IMM_HDR_INIT) {
1300 iscsi_buf_init_iov(&tcp_mtask->headbuf, (char*)mtask->hdr,
1301 sizeof(struct iscsi_hdr));
1302
1303 if (mtask->data_count) {
1304 tcp_mtask->xmstate |= XMSTATE_IMM_DATA;
1305 iscsi_buf_init_iov(&tcp_mtask->sendbuf,
1306 (char*)mtask->data,
1307 mtask->data_count);
1308 }
1309
1310 if (conn->c_stage != ISCSI_CONN_INITIAL_STAGE &&
1311 conn->stop_stage != STOP_CONN_RECOVER &&
1312 conn->hdrdgst_en)
1313 iscsi_hdr_digest(conn, &tcp_mtask->headbuf,
1314 (u8*)tcp_mtask->hdrext);
1315
1316 tcp_mtask->sent = 0;
1317 tcp_mtask->xmstate &= ~XMSTATE_IMM_HDR_INIT;
1318 tcp_mtask->xmstate |= XMSTATE_IMM_HDR;
1319 }
1320
1321 if (tcp_mtask->xmstate & XMSTATE_IMM_HDR) {
1322 rc = iscsi_sendhdr(conn, &tcp_mtask->headbuf,
1323 mtask->data_count);
1324 if (rc)
1325 return rc;
1326 tcp_mtask->xmstate &= ~XMSTATE_IMM_HDR;
1327 }
1328
1329 if (tcp_mtask->xmstate & XMSTATE_IMM_DATA) {
1330 BUG_ON(!mtask->data_count);
1331 tcp_mtask->xmstate &= ~XMSTATE_IMM_DATA;
1332 /* FIXME: implement.
1333 * Virtual buffer could be spreaded across multiple pages...
1334 */
1335 do {
1336 int rc;
1337
1338 rc = iscsi_sendpage(conn, &tcp_mtask->sendbuf,
1339 &mtask->data_count, &tcp_mtask->sent);
1340 if (rc) {
1341 tcp_mtask->xmstate |= XMSTATE_IMM_DATA;
1342 return rc;
1343 }
1344 } while (mtask->data_count);
1345 }
1346
1347 BUG_ON(tcp_mtask->xmstate != XMSTATE_IDLE);
1348 if (mtask->hdr->itt == RESERVED_ITT) {
1349 struct iscsi_session *session = conn->session;
1350
1351 spin_lock_bh(&session->lock);
1352 list_del(&conn->mtask->running);
1353 __kfifo_put(session->mgmtpool.queue, (void*)&conn->mtask,
1354 sizeof(void*));
1355 spin_unlock_bh(&session->lock);
1356 }
1357 return 0;
1358 }
1359
1360 static int
1361 iscsi_send_cmd_hdr(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask)
1362 {
1363 struct scsi_cmnd *sc = ctask->sc;
1364 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1365 int rc = 0;
1366
1367 if (tcp_ctask->xmstate & XMSTATE_CMD_HDR_INIT) {
1368 tcp_ctask->sent = 0;
1369 tcp_ctask->sg_count = 0;
1370 tcp_ctask->exp_datasn = 0;
1371
1372 if (sc->sc_data_direction == DMA_TO_DEVICE) {
1373 struct scatterlist *sg = scsi_sglist(sc);
1374
1375 iscsi_buf_init_sg(&tcp_ctask->sendbuf, sg);
1376 tcp_ctask->sg = sg + 1;
1377 tcp_ctask->bad_sg = sg + scsi_sg_count(sc);
1378
1379 debug_scsi("cmd [itt 0x%x total %d imm_data %d "
1380 "unsol count %d, unsol offset %d]\n",
1381 ctask->itt, scsi_bufflen(sc),
1382 ctask->imm_count, ctask->unsol_count,
1383 ctask->unsol_offset);
1384 }
1385
1386 iscsi_buf_init_iov(&tcp_ctask->headbuf, (char*)ctask->hdr,
1387 ctask->hdr_len);
1388
1389 if (conn->hdrdgst_en)
1390 iscsi_hdr_digest(conn, &tcp_ctask->headbuf,
1391 iscsi_next_hdr(ctask));
1392 tcp_ctask->xmstate &= ~XMSTATE_CMD_HDR_INIT;
1393 tcp_ctask->xmstate |= XMSTATE_CMD_HDR_XMIT;
1394 }
1395
1396 if (tcp_ctask->xmstate & XMSTATE_CMD_HDR_XMIT) {
1397 rc = iscsi_sendhdr(conn, &tcp_ctask->headbuf, ctask->imm_count);
1398 if (rc)
1399 return rc;
1400 tcp_ctask->xmstate &= ~XMSTATE_CMD_HDR_XMIT;
1401
1402 if (sc->sc_data_direction != DMA_TO_DEVICE)
1403 return 0;
1404
1405 if (ctask->imm_count) {
1406 tcp_ctask->xmstate |= XMSTATE_IMM_DATA;
1407 iscsi_set_padding(tcp_ctask, ctask->imm_count);
1408
1409 if (ctask->conn->datadgst_en) {
1410 iscsi_data_digest_init(ctask->conn->dd_data,
1411 tcp_ctask);
1412 tcp_ctask->immdigest = 0;
1413 }
1414 }
1415
1416 if (ctask->unsol_count)
1417 tcp_ctask->xmstate |=
1418 XMSTATE_UNS_HDR | XMSTATE_UNS_INIT;
1419 }
1420 return rc;
1421 }
1422
1423 static int
1424 iscsi_send_padding(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask)
1425 {
1426 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1427 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1428 int sent = 0, rc;
1429
1430 if (tcp_ctask->xmstate & XMSTATE_W_PAD) {
1431 iscsi_buf_init_iov(&tcp_ctask->sendbuf, (char*)&tcp_ctask->pad,
1432 tcp_ctask->pad_count);
1433 if (conn->datadgst_en)
1434 crypto_hash_update(&tcp_conn->tx_hash,
1435 &tcp_ctask->sendbuf.sg,
1436 tcp_ctask->sendbuf.sg.length);
1437 } else if (!(tcp_ctask->xmstate & XMSTATE_W_RESEND_PAD))
1438 return 0;
1439
1440 tcp_ctask->xmstate &= ~XMSTATE_W_PAD;
1441 tcp_ctask->xmstate &= ~XMSTATE_W_RESEND_PAD;
1442 debug_scsi("sending %d pad bytes for itt 0x%x\n",
1443 tcp_ctask->pad_count, ctask->itt);
1444 rc = iscsi_sendpage(conn, &tcp_ctask->sendbuf, &tcp_ctask->pad_count,
1445 &sent);
1446 if (rc) {
1447 debug_scsi("padding send failed %d\n", rc);
1448 tcp_ctask->xmstate |= XMSTATE_W_RESEND_PAD;
1449 }
1450 return rc;
1451 }
1452
1453 static int
1454 iscsi_send_digest(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask,
1455 struct iscsi_buf *buf, uint32_t *digest)
1456 {
1457 struct iscsi_tcp_cmd_task *tcp_ctask;
1458 struct iscsi_tcp_conn *tcp_conn;
1459 int rc, sent = 0;
1460
1461 if (!conn->datadgst_en)
1462 return 0;
1463
1464 tcp_ctask = ctask->dd_data;
1465 tcp_conn = conn->dd_data;
1466
1467 if (!(tcp_ctask->xmstate & XMSTATE_W_RESEND_DATA_DIGEST)) {
1468 crypto_hash_final(&tcp_conn->tx_hash, (u8*)digest);
1469 iscsi_buf_init_iov(buf, (char*)digest, 4);
1470 }
1471 tcp_ctask->xmstate &= ~XMSTATE_W_RESEND_DATA_DIGEST;
1472
1473 rc = iscsi_sendpage(conn, buf, &tcp_ctask->digest_count, &sent);
1474 if (!rc)
1475 debug_scsi("sent digest 0x%x for itt 0x%x\n", *digest,
1476 ctask->itt);
1477 else {
1478 debug_scsi("sending digest 0x%x failed for itt 0x%x!\n",
1479 *digest, ctask->itt);
1480 tcp_ctask->xmstate |= XMSTATE_W_RESEND_DATA_DIGEST;
1481 }
1482 return rc;
1483 }
1484
1485 static int
1486 iscsi_send_data(struct iscsi_cmd_task *ctask, struct iscsi_buf *sendbuf,
1487 struct scatterlist **sg, int *sent, int *count,
1488 struct iscsi_buf *digestbuf, uint32_t *digest)
1489 {
1490 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1491 struct iscsi_conn *conn = ctask->conn;
1492 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1493 int rc, buf_sent, offset;
1494
1495 while (*count) {
1496 buf_sent = 0;
1497 offset = sendbuf->sent;
1498
1499 rc = iscsi_sendpage(conn, sendbuf, count, &buf_sent);
1500 *sent = *sent + buf_sent;
1501 if (buf_sent && conn->datadgst_en)
1502 partial_sg_digest_update(&tcp_conn->tx_hash,
1503 &sendbuf->sg, sendbuf->sg.offset + offset,
1504 buf_sent);
1505 if (!iscsi_buf_left(sendbuf) && *sg != tcp_ctask->bad_sg) {
1506 iscsi_buf_init_sg(sendbuf, *sg);
1507 *sg = *sg + 1;
1508 }
1509
1510 if (rc)
1511 return rc;
1512 }
1513
1514 rc = iscsi_send_padding(conn, ctask);
1515 if (rc)
1516 return rc;
1517
1518 return iscsi_send_digest(conn, ctask, digestbuf, digest);
1519 }
1520
1521 static int
1522 iscsi_send_unsol_hdr(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask)
1523 {
1524 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1525 struct iscsi_data_task *dtask;
1526 int rc;
1527
1528 tcp_ctask->xmstate |= XMSTATE_UNS_DATA;
1529 if (tcp_ctask->xmstate & XMSTATE_UNS_INIT) {
1530 dtask = &tcp_ctask->unsol_dtask;
1531
1532 iscsi_prep_unsolicit_data_pdu(ctask, &dtask->hdr);
1533 iscsi_buf_init_iov(&tcp_ctask->headbuf, (char*)&dtask->hdr,
1534 sizeof(struct iscsi_hdr));
1535 if (conn->hdrdgst_en)
1536 iscsi_hdr_digest(conn, &tcp_ctask->headbuf,
1537 (u8*)dtask->hdrext);
1538
1539 tcp_ctask->xmstate &= ~XMSTATE_UNS_INIT;
1540 iscsi_set_padding(tcp_ctask, ctask->data_count);
1541 }
1542
1543 rc = iscsi_sendhdr(conn, &tcp_ctask->headbuf, ctask->data_count);
1544 if (rc) {
1545 tcp_ctask->xmstate &= ~XMSTATE_UNS_DATA;
1546 tcp_ctask->xmstate |= XMSTATE_UNS_HDR;
1547 return rc;
1548 }
1549
1550 if (conn->datadgst_en) {
1551 dtask = &tcp_ctask->unsol_dtask;
1552 iscsi_data_digest_init(ctask->conn->dd_data, tcp_ctask);
1553 dtask->digest = 0;
1554 }
1555
1556 debug_scsi("uns dout [itt 0x%x dlen %d sent %d]\n",
1557 ctask->itt, ctask->unsol_count, tcp_ctask->sent);
1558 return 0;
1559 }
1560
1561 static int
1562 iscsi_send_unsol_pdu(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask)
1563 {
1564 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1565 int rc;
1566
1567 if (tcp_ctask->xmstate & XMSTATE_UNS_HDR) {
1568 BUG_ON(!ctask->unsol_count);
1569 tcp_ctask->xmstate &= ~XMSTATE_UNS_HDR;
1570 send_hdr:
1571 rc = iscsi_send_unsol_hdr(conn, ctask);
1572 if (rc)
1573 return rc;
1574 }
1575
1576 if (tcp_ctask->xmstate & XMSTATE_UNS_DATA) {
1577 struct iscsi_data_task *dtask = &tcp_ctask->unsol_dtask;
1578 int start = tcp_ctask->sent;
1579
1580 rc = iscsi_send_data(ctask, &tcp_ctask->sendbuf, &tcp_ctask->sg,
1581 &tcp_ctask->sent, &ctask->data_count,
1582 &dtask->digestbuf, &dtask->digest);
1583 ctask->unsol_count -= tcp_ctask->sent - start;
1584 if (rc)
1585 return rc;
1586 tcp_ctask->xmstate &= ~XMSTATE_UNS_DATA;
1587 /*
1588 * Done with the Data-Out. Next, check if we need
1589 * to send another unsolicited Data-Out.
1590 */
1591 if (ctask->unsol_count) {
1592 debug_scsi("sending more uns\n");
1593 tcp_ctask->xmstate |= XMSTATE_UNS_INIT;
1594 goto send_hdr;
1595 }
1596 }
1597 return 0;
1598 }
1599
1600 static int iscsi_send_sol_pdu(struct iscsi_conn *conn,
1601 struct iscsi_cmd_task *ctask)
1602 {
1603 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1604 struct iscsi_session *session = conn->session;
1605 struct iscsi_r2t_info *r2t;
1606 struct iscsi_data_task *dtask;
1607 int left, rc;
1608
1609 if (tcp_ctask->xmstate & XMSTATE_SOL_HDR_INIT) {
1610 if (!tcp_ctask->r2t) {
1611 spin_lock_bh(&session->lock);
1612 __kfifo_get(tcp_ctask->r2tqueue, (void*)&tcp_ctask->r2t,
1613 sizeof(void*));
1614 spin_unlock_bh(&session->lock);
1615 }
1616 send_hdr:
1617 r2t = tcp_ctask->r2t;
1618 dtask = &r2t->dtask;
1619
1620 if (conn->hdrdgst_en)
1621 iscsi_hdr_digest(conn, &r2t->headbuf,
1622 (u8*)dtask->hdrext);
1623 tcp_ctask->xmstate &= ~XMSTATE_SOL_HDR_INIT;
1624 tcp_ctask->xmstate |= XMSTATE_SOL_HDR;
1625 }
1626
1627 if (tcp_ctask->xmstate & XMSTATE_SOL_HDR) {
1628 r2t = tcp_ctask->r2t;
1629 dtask = &r2t->dtask;
1630
1631 rc = iscsi_sendhdr(conn, &r2t->headbuf, r2t->data_count);
1632 if (rc)
1633 return rc;
1634 tcp_ctask->xmstate &= ~XMSTATE_SOL_HDR;
1635 tcp_ctask->xmstate |= XMSTATE_SOL_DATA;
1636
1637 if (conn->datadgst_en) {
1638 iscsi_data_digest_init(conn->dd_data, tcp_ctask);
1639 dtask->digest = 0;
1640 }
1641
1642 iscsi_set_padding(tcp_ctask, r2t->data_count);
1643 debug_scsi("sol dout [dsn %d itt 0x%x dlen %d sent %d]\n",
1644 r2t->solicit_datasn - 1, ctask->itt, r2t->data_count,
1645 r2t->sent);
1646 }
1647
1648 if (tcp_ctask->xmstate & XMSTATE_SOL_DATA) {
1649 r2t = tcp_ctask->r2t;
1650 dtask = &r2t->dtask;
1651
1652 rc = iscsi_send_data(ctask, &r2t->sendbuf, &r2t->sg,
1653 &r2t->sent, &r2t->data_count,
1654 &dtask->digestbuf, &dtask->digest);
1655 if (rc)
1656 return rc;
1657 tcp_ctask->xmstate &= ~XMSTATE_SOL_DATA;
1658
1659 /*
1660 * Done with this Data-Out. Next, check if we have
1661 * to send another Data-Out for this R2T.
1662 */
1663 BUG_ON(r2t->data_length - r2t->sent < 0);
1664 left = r2t->data_length - r2t->sent;
1665 if (left) {
1666 iscsi_solicit_data_cont(conn, ctask, r2t, left);
1667 goto send_hdr;
1668 }
1669
1670 /*
1671 * Done with this R2T. Check if there are more
1672 * outstanding R2Ts ready to be processed.
1673 */
1674 spin_lock_bh(&session->lock);
1675 tcp_ctask->r2t = NULL;
1676 __kfifo_put(tcp_ctask->r2tpool.queue, (void*)&r2t,
1677 sizeof(void*));
1678 if (__kfifo_get(tcp_ctask->r2tqueue, (void*)&r2t,
1679 sizeof(void*))) {
1680 tcp_ctask->r2t = r2t;
1681 spin_unlock_bh(&session->lock);
1682 goto send_hdr;
1683 }
1684 spin_unlock_bh(&session->lock);
1685 }
1686 return 0;
1687 }
1688
1689 /**
1690 * iscsi_tcp_ctask_xmit - xmit normal PDU task
1691 * @conn: iscsi connection
1692 * @ctask: iscsi command task
1693 *
1694 * Notes:
1695 * The function can return -EAGAIN in which case caller must
1696 * call it again later, or recover. '0' return code means successful
1697 * xmit.
1698 * The function is devided to logical helpers (above) for the different
1699 * xmit stages.
1700 *
1701 *iscsi_send_cmd_hdr()
1702 * XMSTATE_CMD_HDR_INIT - prepare Header and Data buffers Calculate
1703 * Header Digest
1704 * XMSTATE_CMD_HDR_XMIT - Transmit header in progress
1705 *
1706 *iscsi_send_padding
1707 * XMSTATE_W_PAD - Prepare and send pading
1708 * XMSTATE_W_RESEND_PAD - retry send pading
1709 *
1710 *iscsi_send_digest
1711 * XMSTATE_W_RESEND_DATA_DIGEST - Finalize and send Data Digest
1712 * XMSTATE_W_RESEND_DATA_DIGEST - retry sending digest
1713 *
1714 *iscsi_send_unsol_hdr
1715 * XMSTATE_UNS_INIT - prepare un-solicit data header and digest
1716 * XMSTATE_UNS_HDR - send un-solicit header
1717 *
1718 *iscsi_send_unsol_pdu
1719 * XMSTATE_UNS_DATA - send un-solicit data in progress
1720 *
1721 *iscsi_send_sol_pdu
1722 * XMSTATE_SOL_HDR_INIT - solicit data header and digest initialize
1723 * XMSTATE_SOL_HDR - send solicit header
1724 * XMSTATE_SOL_DATA - send solicit data
1725 *
1726 *iscsi_tcp_ctask_xmit
1727 * XMSTATE_IMM_DATA - xmit managment data (??)
1728 **/
1729 static int
1730 iscsi_tcp_ctask_xmit(struct iscsi_conn *conn, struct iscsi_cmd_task *ctask)
1731 {
1732 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1733 int rc = 0;
1734
1735 debug_scsi("ctask deq [cid %d xmstate %x itt 0x%x]\n",
1736 conn->id, tcp_ctask->xmstate, ctask->itt);
1737
1738 rc = iscsi_send_cmd_hdr(conn, ctask);
1739 if (rc)
1740 return rc;
1741 if (ctask->sc->sc_data_direction != DMA_TO_DEVICE)
1742 return 0;
1743
1744 if (tcp_ctask->xmstate & XMSTATE_IMM_DATA) {
1745 rc = iscsi_send_data(ctask, &tcp_ctask->sendbuf, &tcp_ctask->sg,
1746 &tcp_ctask->sent, &ctask->imm_count,
1747 &tcp_ctask->immbuf, &tcp_ctask->immdigest);
1748 if (rc)
1749 return rc;
1750 tcp_ctask->xmstate &= ~XMSTATE_IMM_DATA;
1751 }
1752
1753 rc = iscsi_send_unsol_pdu(conn, ctask);
1754 if (rc)
1755 return rc;
1756
1757 rc = iscsi_send_sol_pdu(conn, ctask);
1758 if (rc)
1759 return rc;
1760
1761 return rc;
1762 }
1763
1764 static struct iscsi_cls_conn *
1765 iscsi_tcp_conn_create(struct iscsi_cls_session *cls_session, uint32_t conn_idx)
1766 {
1767 struct iscsi_conn *conn;
1768 struct iscsi_cls_conn *cls_conn;
1769 struct iscsi_tcp_conn *tcp_conn;
1770
1771 cls_conn = iscsi_conn_setup(cls_session, conn_idx);
1772 if (!cls_conn)
1773 return NULL;
1774 conn = cls_conn->dd_data;
1775 /*
1776 * due to strange issues with iser these are not set
1777 * in iscsi_conn_setup
1778 */
1779 conn->max_recv_dlength = ISCSI_DEF_MAX_RECV_SEG_LEN;
1780
1781 tcp_conn = kzalloc(sizeof(*tcp_conn), GFP_KERNEL);
1782 if (!tcp_conn)
1783 goto tcp_conn_alloc_fail;
1784
1785 conn->dd_data = tcp_conn;
1786 tcp_conn->iscsi_conn = conn;
1787
1788 tcp_conn->tx_hash.tfm = crypto_alloc_hash("crc32c", 0,
1789 CRYPTO_ALG_ASYNC);
1790 tcp_conn->tx_hash.flags = 0;
1791 if (IS_ERR(tcp_conn->tx_hash.tfm)) {
1792 printk(KERN_ERR "Could not create connection due to crc32c "
1793 "loading error %ld. Make sure the crc32c module is "
1794 "built as a module or into the kernel\n",
1795 PTR_ERR(tcp_conn->tx_hash.tfm));
1796 goto free_tcp_conn;
1797 }
1798
1799 tcp_conn->rx_hash.tfm = crypto_alloc_hash("crc32c", 0,
1800 CRYPTO_ALG_ASYNC);
1801 tcp_conn->rx_hash.flags = 0;
1802 if (IS_ERR(tcp_conn->rx_hash.tfm)) {
1803 printk(KERN_ERR "Could not create connection due to crc32c "
1804 "loading error %ld. Make sure the crc32c module is "
1805 "built as a module or into the kernel\n",
1806 PTR_ERR(tcp_conn->rx_hash.tfm));
1807 goto free_tx_tfm;
1808 }
1809
1810 return cls_conn;
1811
1812 free_tx_tfm:
1813 crypto_free_hash(tcp_conn->tx_hash.tfm);
1814 free_tcp_conn:
1815 kfree(tcp_conn);
1816 tcp_conn_alloc_fail:
1817 iscsi_conn_teardown(cls_conn);
1818 return NULL;
1819 }
1820
1821 static void
1822 iscsi_tcp_release_conn(struct iscsi_conn *conn)
1823 {
1824 struct iscsi_session *session = conn->session;
1825 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1826 struct socket *sock = tcp_conn->sock;
1827
1828 if (!sock)
1829 return;
1830
1831 sock_hold(sock->sk);
1832 iscsi_conn_restore_callbacks(tcp_conn);
1833 sock_put(sock->sk);
1834
1835 spin_lock_bh(&session->lock);
1836 tcp_conn->sock = NULL;
1837 conn->recv_lock = NULL;
1838 spin_unlock_bh(&session->lock);
1839 sockfd_put(sock);
1840 }
1841
1842 static void
1843 iscsi_tcp_conn_destroy(struct iscsi_cls_conn *cls_conn)
1844 {
1845 struct iscsi_conn *conn = cls_conn->dd_data;
1846 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1847
1848 iscsi_tcp_release_conn(conn);
1849 iscsi_conn_teardown(cls_conn);
1850
1851 if (tcp_conn->tx_hash.tfm)
1852 crypto_free_hash(tcp_conn->tx_hash.tfm);
1853 if (tcp_conn->rx_hash.tfm)
1854 crypto_free_hash(tcp_conn->rx_hash.tfm);
1855
1856 kfree(tcp_conn);
1857 }
1858
1859 static void
1860 iscsi_tcp_conn_stop(struct iscsi_cls_conn *cls_conn, int flag)
1861 {
1862 struct iscsi_conn *conn = cls_conn->dd_data;
1863
1864 iscsi_conn_stop(cls_conn, flag);
1865 iscsi_tcp_release_conn(conn);
1866 }
1867
1868 static int iscsi_tcp_get_addr(struct iscsi_conn *conn, struct socket *sock,
1869 char *buf, int *port,
1870 int (*getname)(struct socket *, struct sockaddr *,
1871 int *addrlen))
1872 {
1873 struct sockaddr_storage *addr;
1874 struct sockaddr_in6 *sin6;
1875 struct sockaddr_in *sin;
1876 int rc = 0, len;
1877
1878 addr = kmalloc(sizeof(*addr), GFP_KERNEL);
1879 if (!addr)
1880 return -ENOMEM;
1881
1882 if (getname(sock, (struct sockaddr *) addr, &len)) {
1883 rc = -ENODEV;
1884 goto free_addr;
1885 }
1886
1887 switch (addr->ss_family) {
1888 case AF_INET:
1889 sin = (struct sockaddr_in *)addr;
1890 spin_lock_bh(&conn->session->lock);
1891 sprintf(buf, NIPQUAD_FMT, NIPQUAD(sin->sin_addr.s_addr));
1892 *port = be16_to_cpu(sin->sin_port);
1893 spin_unlock_bh(&conn->session->lock);
1894 break;
1895 case AF_INET6:
1896 sin6 = (struct sockaddr_in6 *)addr;
1897 spin_lock_bh(&conn->session->lock);
1898 sprintf(buf, NIP6_FMT, NIP6(sin6->sin6_addr));
1899 *port = be16_to_cpu(sin6->sin6_port);
1900 spin_unlock_bh(&conn->session->lock);
1901 break;
1902 }
1903 free_addr:
1904 kfree(addr);
1905 return rc;
1906 }
1907
1908 static int
1909 iscsi_tcp_conn_bind(struct iscsi_cls_session *cls_session,
1910 struct iscsi_cls_conn *cls_conn, uint64_t transport_eph,
1911 int is_leading)
1912 {
1913 struct iscsi_conn *conn = cls_conn->dd_data;
1914 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
1915 struct sock *sk;
1916 struct socket *sock;
1917 int err;
1918
1919 /* lookup for existing socket */
1920 sock = sockfd_lookup((int)transport_eph, &err);
1921 if (!sock) {
1922 printk(KERN_ERR "iscsi_tcp: sockfd_lookup failed %d\n", err);
1923 return -EEXIST;
1924 }
1925 /*
1926 * copy these values now because if we drop the session
1927 * userspace may still want to query the values since we will
1928 * be using them for the reconnect
1929 */
1930 err = iscsi_tcp_get_addr(conn, sock, conn->portal_address,
1931 &conn->portal_port, kernel_getpeername);
1932 if (err)
1933 goto free_socket;
1934
1935 err = iscsi_tcp_get_addr(conn, sock, conn->local_address,
1936 &conn->local_port, kernel_getsockname);
1937 if (err)
1938 goto free_socket;
1939
1940 err = iscsi_conn_bind(cls_session, cls_conn, is_leading);
1941 if (err)
1942 goto free_socket;
1943
1944 /* bind iSCSI connection and socket */
1945 tcp_conn->sock = sock;
1946
1947 /* setup Socket parameters */
1948 sk = sock->sk;
1949 sk->sk_reuse = 1;
1950 sk->sk_sndtimeo = 15 * HZ; /* FIXME: make it configurable */
1951 sk->sk_allocation = GFP_ATOMIC;
1952
1953 /* FIXME: disable Nagle's algorithm */
1954
1955 /*
1956 * Intercept TCP callbacks for sendfile like receive
1957 * processing.
1958 */
1959 conn->recv_lock = &sk->sk_callback_lock;
1960 iscsi_conn_set_callbacks(conn);
1961 tcp_conn->sendpage = tcp_conn->sock->ops->sendpage;
1962 /*
1963 * set receive state machine into initial state
1964 */
1965 iscsi_tcp_hdr_recv_prep(tcp_conn);
1966 return 0;
1967
1968 free_socket:
1969 sockfd_put(sock);
1970 return err;
1971 }
1972
1973 /* called with host lock */
1974 static void
1975 iscsi_tcp_mgmt_init(struct iscsi_conn *conn, struct iscsi_mgmt_task *mtask)
1976 {
1977 struct iscsi_tcp_mgmt_task *tcp_mtask = mtask->dd_data;
1978 tcp_mtask->xmstate = XMSTATE_IMM_HDR_INIT;
1979 }
1980
1981 static int
1982 iscsi_r2tpool_alloc(struct iscsi_session *session)
1983 {
1984 int i;
1985 int cmd_i;
1986
1987 /*
1988 * initialize per-task: R2T pool and xmit queue
1989 */
1990 for (cmd_i = 0; cmd_i < session->cmds_max; cmd_i++) {
1991 struct iscsi_cmd_task *ctask = session->cmds[cmd_i];
1992 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
1993
1994 /*
1995 * pre-allocated x4 as much r2ts to handle race when
1996 * target acks DataOut faster than we data_xmit() queues
1997 * could replenish r2tqueue.
1998 */
1999
2000 /* R2T pool */
2001 if (iscsi_pool_init(&tcp_ctask->r2tpool, session->max_r2t * 4,
2002 (void***)&tcp_ctask->r2ts,
2003 sizeof(struct iscsi_r2t_info))) {
2004 goto r2t_alloc_fail;
2005 }
2006
2007 /* R2T xmit queue */
2008 tcp_ctask->r2tqueue = kfifo_alloc(
2009 session->max_r2t * 4 * sizeof(void*), GFP_KERNEL, NULL);
2010 if (tcp_ctask->r2tqueue == ERR_PTR(-ENOMEM)) {
2011 iscsi_pool_free(&tcp_ctask->r2tpool,
2012 (void**)tcp_ctask->r2ts);
2013 goto r2t_alloc_fail;
2014 }
2015 }
2016
2017 return 0;
2018
2019 r2t_alloc_fail:
2020 for (i = 0; i < cmd_i; i++) {
2021 struct iscsi_cmd_task *ctask = session->cmds[i];
2022 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
2023
2024 kfifo_free(tcp_ctask->r2tqueue);
2025 iscsi_pool_free(&tcp_ctask->r2tpool,
2026 (void**)tcp_ctask->r2ts);
2027 }
2028 return -ENOMEM;
2029 }
2030
2031 static void
2032 iscsi_r2tpool_free(struct iscsi_session *session)
2033 {
2034 int i;
2035
2036 for (i = 0; i < session->cmds_max; i++) {
2037 struct iscsi_cmd_task *ctask = session->cmds[i];
2038 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
2039
2040 kfifo_free(tcp_ctask->r2tqueue);
2041 iscsi_pool_free(&tcp_ctask->r2tpool,
2042 (void**)tcp_ctask->r2ts);
2043 }
2044 }
2045
2046 static int
2047 iscsi_conn_set_param(struct iscsi_cls_conn *cls_conn, enum iscsi_param param,
2048 char *buf, int buflen)
2049 {
2050 struct iscsi_conn *conn = cls_conn->dd_data;
2051 struct iscsi_session *session = conn->session;
2052 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
2053 int value;
2054
2055 switch(param) {
2056 case ISCSI_PARAM_HDRDGST_EN:
2057 iscsi_set_param(cls_conn, param, buf, buflen);
2058 break;
2059 case ISCSI_PARAM_DATADGST_EN:
2060 iscsi_set_param(cls_conn, param, buf, buflen);
2061 tcp_conn->sendpage = conn->datadgst_en ?
2062 sock_no_sendpage : tcp_conn->sock->ops->sendpage;
2063 break;
2064 case ISCSI_PARAM_MAX_R2T:
2065 sscanf(buf, "%d", &value);
2066 if (session->max_r2t == roundup_pow_of_two(value))
2067 break;
2068 iscsi_r2tpool_free(session);
2069 iscsi_set_param(cls_conn, param, buf, buflen);
2070 if (session->max_r2t & (session->max_r2t - 1))
2071 session->max_r2t = roundup_pow_of_two(session->max_r2t);
2072 if (iscsi_r2tpool_alloc(session))
2073 return -ENOMEM;
2074 break;
2075 default:
2076 return iscsi_set_param(cls_conn, param, buf, buflen);
2077 }
2078
2079 return 0;
2080 }
2081
2082 static int
2083 iscsi_tcp_conn_get_param(struct iscsi_cls_conn *cls_conn,
2084 enum iscsi_param param, char *buf)
2085 {
2086 struct iscsi_conn *conn = cls_conn->dd_data;
2087 int len;
2088
2089 switch(param) {
2090 case ISCSI_PARAM_CONN_PORT:
2091 spin_lock_bh(&conn->session->lock);
2092 len = sprintf(buf, "%hu\n", conn->portal_port);
2093 spin_unlock_bh(&conn->session->lock);
2094 break;
2095 case ISCSI_PARAM_CONN_ADDRESS:
2096 spin_lock_bh(&conn->session->lock);
2097 len = sprintf(buf, "%s\n", conn->portal_address);
2098 spin_unlock_bh(&conn->session->lock);
2099 break;
2100 default:
2101 return iscsi_conn_get_param(cls_conn, param, buf);
2102 }
2103
2104 return len;
2105 }
2106
2107 static int
2108 iscsi_tcp_host_get_param(struct Scsi_Host *shost, enum iscsi_host_param param,
2109 char *buf)
2110 {
2111 struct iscsi_session *session = iscsi_hostdata(shost->hostdata);
2112 int len;
2113
2114 switch (param) {
2115 case ISCSI_HOST_PARAM_IPADDRESS:
2116 spin_lock_bh(&session->lock);
2117 if (!session->leadconn)
2118 len = -ENODEV;
2119 else
2120 len = sprintf(buf, "%s\n",
2121 session->leadconn->local_address);
2122 spin_unlock_bh(&session->lock);
2123 break;
2124 default:
2125 return iscsi_host_get_param(shost, param, buf);
2126 }
2127 return len;
2128 }
2129
2130 static void
2131 iscsi_conn_get_stats(struct iscsi_cls_conn *cls_conn, struct iscsi_stats *stats)
2132 {
2133 struct iscsi_conn *conn = cls_conn->dd_data;
2134 struct iscsi_tcp_conn *tcp_conn = conn->dd_data;
2135
2136 stats->txdata_octets = conn->txdata_octets;
2137 stats->rxdata_octets = conn->rxdata_octets;
2138 stats->scsicmd_pdus = conn->scsicmd_pdus_cnt;
2139 stats->dataout_pdus = conn->dataout_pdus_cnt;
2140 stats->scsirsp_pdus = conn->scsirsp_pdus_cnt;
2141 stats->datain_pdus = conn->datain_pdus_cnt;
2142 stats->r2t_pdus = conn->r2t_pdus_cnt;
2143 stats->tmfcmd_pdus = conn->tmfcmd_pdus_cnt;
2144 stats->tmfrsp_pdus = conn->tmfrsp_pdus_cnt;
2145 stats->custom_length = 3;
2146 strcpy(stats->custom[0].desc, "tx_sendpage_failures");
2147 stats->custom[0].value = tcp_conn->sendpage_failures_cnt;
2148 strcpy(stats->custom[1].desc, "rx_discontiguous_hdr");
2149 stats->custom[1].value = tcp_conn->discontiguous_hdr_cnt;
2150 strcpy(stats->custom[2].desc, "eh_abort_cnt");
2151 stats->custom[2].value = conn->eh_abort_cnt;
2152 }
2153
2154 static struct iscsi_cls_session *
2155 iscsi_tcp_session_create(struct iscsi_transport *iscsit,
2156 struct scsi_transport_template *scsit,
2157 uint16_t cmds_max, uint16_t qdepth,
2158 uint32_t initial_cmdsn, uint32_t *hostno)
2159 {
2160 struct iscsi_cls_session *cls_session;
2161 struct iscsi_session *session;
2162 uint32_t hn;
2163 int cmd_i;
2164
2165 cls_session = iscsi_session_setup(iscsit, scsit, cmds_max, qdepth,
2166 sizeof(struct iscsi_tcp_cmd_task),
2167 sizeof(struct iscsi_tcp_mgmt_task),
2168 initial_cmdsn, &hn);
2169 if (!cls_session)
2170 return NULL;
2171 *hostno = hn;
2172
2173 session = class_to_transport_session(cls_session);
2174 for (cmd_i = 0; cmd_i < session->cmds_max; cmd_i++) {
2175 struct iscsi_cmd_task *ctask = session->cmds[cmd_i];
2176 struct iscsi_tcp_cmd_task *tcp_ctask = ctask->dd_data;
2177
2178 ctask->hdr = &tcp_ctask->hdr.cmd_hdr;
2179 ctask->hdr_max = sizeof(tcp_ctask->hdr) - ISCSI_DIGEST_SIZE;
2180 }
2181
2182 for (cmd_i = 0; cmd_i < session->mgmtpool_max; cmd_i++) {
2183 struct iscsi_mgmt_task *mtask = session->mgmt_cmds[cmd_i];
2184 struct iscsi_tcp_mgmt_task *tcp_mtask = mtask->dd_data;
2185
2186 mtask->hdr = &tcp_mtask->hdr;
2187 }
2188
2189 if (iscsi_r2tpool_alloc(class_to_transport_session(cls_session)))
2190 goto r2tpool_alloc_fail;
2191
2192 return cls_session;
2193
2194 r2tpool_alloc_fail:
2195 iscsi_session_teardown(cls_session);
2196 return NULL;
2197 }
2198
/**
 * iscsi_tcp_session_destroy - destroy_session callback of the TCP transport
 * @cls_session: class session to destroy
 *
 * Frees the session's R2T pool first, then hands the class session to
 * iscsi_session_teardown().
 */
static void iscsi_tcp_session_destroy(struct iscsi_cls_session *cls_session)
{
	struct iscsi_session *session = class_to_transport_session(cls_session);

	iscsi_r2tpool_free(session);
	iscsi_session_teardown(cls_session);
}
2204
2205 static int iscsi_tcp_slave_configure(struct scsi_device *sdev)
2206 {
2207 blk_queue_bounce_limit(sdev->request_queue, BLK_BOUNCE_ANY);
2208 blk_queue_dma_alignment(sdev->request_queue, 0);
2209 return 0;
2210 }
2211
2212 static struct scsi_host_template iscsi_sht = {
2213 .module = THIS_MODULE,
2214 .name = "iSCSI Initiator over TCP/IP",
2215 .queuecommand = iscsi_queuecommand,
2216 .change_queue_depth = iscsi_change_queue_depth,
2217 .can_queue = ISCSI_DEF_XMIT_CMDS_MAX - 1,
2218 .sg_tablesize = ISCSI_SG_TABLESIZE,
2219 .max_sectors = 0xFFFF,
2220 .cmd_per_lun = ISCSI_DEF_CMD_PER_LUN,
2221 .eh_abort_handler = iscsi_eh_abort,
2222 .eh_device_reset_handler= iscsi_eh_device_reset,
2223 .eh_host_reset_handler = iscsi_eh_host_reset,
2224 .use_clustering = DISABLE_CLUSTERING,
2225 .slave_configure = iscsi_tcp_slave_configure,
2226 .proc_name = "iscsi_tcp",
2227 .this_id = -1,
2228 };
2229
2230 static struct iscsi_transport iscsi_tcp_transport = {
2231 .owner = THIS_MODULE,
2232 .name = "tcp",
2233 .caps = CAP_RECOVERY_L0 | CAP_MULTI_R2T | CAP_HDRDGST
2234 | CAP_DATADGST,
2235 .param_mask = ISCSI_MAX_RECV_DLENGTH |
2236 ISCSI_MAX_XMIT_DLENGTH |
2237 ISCSI_HDRDGST_EN |
2238 ISCSI_DATADGST_EN |
2239 ISCSI_INITIAL_R2T_EN |
2240 ISCSI_MAX_R2T |
2241 ISCSI_IMM_DATA_EN |
2242 ISCSI_FIRST_BURST |
2243 ISCSI_MAX_BURST |
2244 ISCSI_PDU_INORDER_EN |
2245 ISCSI_DATASEQ_INORDER_EN |
2246 ISCSI_ERL |
2247 ISCSI_CONN_PORT |
2248 ISCSI_CONN_ADDRESS |
2249 ISCSI_EXP_STATSN |
2250 ISCSI_PERSISTENT_PORT |
2251 ISCSI_PERSISTENT_ADDRESS |
2252 ISCSI_TARGET_NAME | ISCSI_TPGT |
2253 ISCSI_USERNAME | ISCSI_PASSWORD |
2254 ISCSI_USERNAME_IN | ISCSI_PASSWORD_IN |
2255 ISCSI_FAST_ABORT,
2256 .host_param_mask = ISCSI_HOST_HWADDRESS | ISCSI_HOST_IPADDRESS |
2257 ISCSI_HOST_INITIATOR_NAME |
2258 ISCSI_HOST_NETDEV_NAME,
2259 .host_template = &iscsi_sht,
2260 .conndata_size = sizeof(struct iscsi_conn),
2261 .max_conn = 1,
2262 .max_cmd_len = ISCSI_TCP_MAX_CMD_LEN,
2263 /* session management */
2264 .create_session = iscsi_tcp_session_create,
2265 .destroy_session = iscsi_tcp_session_destroy,
2266 /* connection management */
2267 .create_conn = iscsi_tcp_conn_create,
2268 .bind_conn = iscsi_tcp_conn_bind,
2269 .destroy_conn = iscsi_tcp_conn_destroy,
2270 .set_param = iscsi_conn_set_param,
2271 .get_conn_param = iscsi_tcp_conn_get_param,
2272 .get_session_param = iscsi_session_get_param,
2273 .start_conn = iscsi_conn_start,
2274 .stop_conn = iscsi_tcp_conn_stop,
2275 /* iscsi host params */
2276 .get_host_param = iscsi_tcp_host_get_param,
2277 .set_host_param = iscsi_host_set_param,
2278 /* IO */
2279 .send_pdu = iscsi_conn_send_pdu,
2280 .get_stats = iscsi_conn_get_stats,
2281 .init_cmd_task = iscsi_tcp_cmd_init,
2282 .init_mgmt_task = iscsi_tcp_mgmt_init,
2283 .xmit_cmd_task = iscsi_tcp_ctask_xmit,
2284 .xmit_mgmt_task = iscsi_tcp_mtask_xmit,
2285 .cleanup_cmd_task = iscsi_tcp_cleanup_ctask,
2286 /* recovery */
2287 .session_recovery_timedout = iscsi_session_recovery_timedout,
2288 };
2289
2290 static int __init
2291 iscsi_tcp_init(void)
2292 {
2293 if (iscsi_max_lun < 1) {
2294 printk(KERN_ERR "iscsi_tcp: Invalid max_lun value of %u\n",
2295 iscsi_max_lun);
2296 return -EINVAL;
2297 }
2298 iscsi_tcp_transport.max_lun = iscsi_max_lun;
2299
2300 if (!iscsi_register_transport(&iscsi_tcp_transport))
2301 return -ENODEV;
2302
2303 return 0;
2304 }
2305
2306 static void __exit
2307 iscsi_tcp_exit(void)
2308 {
2309 iscsi_unregister_transport(&iscsi_tcp_transport);
2310 }
2311
/* Module load and unload entry points. */
module_init(iscsi_tcp_init);
module_exit(iscsi_tcp_exit);
This page took 0.121519 seconds and 5 git commands to generate.