Root/
1 | /* |
2 | * iSCSI Initiator over TCP/IP Data-Path |
3 | * |
4 | * Copyright (C) 2004 Dmitry Yusupov |
5 | * Copyright (C) 2004 Alex Aizman |
6 | * Copyright (C) 2005 - 2006 Mike Christie |
7 | * Copyright (C) 2006 Red Hat, Inc. All rights reserved. |
8 | * maintained by open-iscsi@googlegroups.com |
9 | * |
10 | * This program is free software; you can redistribute it and/or modify |
11 | * it under the terms of the GNU General Public License as published |
12 | * by the Free Software Foundation; either version 2 of the License, or |
13 | * (at your option) any later version. |
14 | * |
15 | * This program is distributed in the hope that it will be useful, but |
16 | * WITHOUT ANY WARRANTY; without even the implied warranty of |
17 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
18 | * General Public License for more details. |
19 | * |
20 | * See the file COPYING included with this distribution for more details. |
21 | * |
22 | * Credits: |
23 | * Christoph Hellwig |
24 | * FUJITA Tomonori |
25 | * Arne Redlich |
26 | * Zhenyu Wang |
27 | */ |
28 | |
29 | #include <linux/types.h> |
30 | #include <linux/inet.h> |
31 | #include <linux/slab.h> |
32 | #include <linux/file.h> |
33 | #include <linux/blkdev.h> |
34 | #include <linux/crypto.h> |
35 | #include <linux/delay.h> |
36 | #include <linux/kfifo.h> |
37 | #include <linux/scatterlist.h> |
38 | #include <net/tcp.h> |
39 | #include <scsi/scsi_cmnd.h> |
40 | #include <scsi/scsi_device.h> |
41 | #include <scsi/scsi_host.h> |
42 | #include <scsi/scsi.h> |
43 | #include <scsi/scsi_transport_iscsi.h> |
44 | |
45 | #include "iscsi_tcp.h" |
46 | |
47 | MODULE_AUTHOR("Mike Christie <michaelc@cs.wisc.edu>, " |
48 | "Dmitry Yusupov <dmitry_yus@yahoo.com>, " |
49 | "Alex Aizman <itn780@yahoo.com>"); |
50 | MODULE_DESCRIPTION("iSCSI/TCP data-path"); |
51 | MODULE_LICENSE("GPL"); |
52 | |
53 | static struct scsi_transport_template *iscsi_sw_tcp_scsi_transport; |
54 | static struct scsi_host_template iscsi_sw_tcp_sht; |
55 | static struct iscsi_transport iscsi_sw_tcp_transport; |
56 | |
57 | static unsigned int iscsi_max_lun = 512; |
58 | module_param_named(max_lun, iscsi_max_lun, uint, S_IRUGO); |
59 | |
60 | static int iscsi_sw_tcp_dbg; |
61 | module_param_named(debug_iscsi_tcp, iscsi_sw_tcp_dbg, int, |
62 | S_IRUGO | S_IWUSR); |
63 | MODULE_PARM_DESC(debug_iscsi_tcp, "Turn on debugging for iscsi_tcp module " |
64 | "Set to 1 to turn on, and zero to turn off. Default is off."); |
65 | |
/*
 * ISCSI_SW_TCP_DBG - conditional debug print for this module
 * @_conn:   connection handed to iscsi_conn_printk()
 * @dbg_fmt: printf-style format; the calling function's name is prepended
 * @arg:     optional format arguments
 *
 * Emits a KERN_INFO message only when the debug_iscsi_tcp module
 * parameter (iscsi_sw_tcp_dbg) is non-zero.
 *
 * The expansion deliberately does NOT end in a semicolon: the caller
 * supplies it.  That keeps the macro a single statement so it can be
 * used safely as the body of an unbraced if/else.
 */
#define ISCSI_SW_TCP_DBG(_conn, dbg_fmt, arg...)		\
	do {							\
		if (iscsi_sw_tcp_dbg)				\
			iscsi_conn_printk(KERN_INFO, _conn,	\
					  "%s " dbg_fmt,	\
					  __func__, ##arg);	\
	} while (0)
73 | |
74 | |
75 | /** |
76 | * iscsi_sw_tcp_recv - TCP receive in sendfile fashion |
77 | * @rd_desc: read descriptor |
78 | * @skb: socket buffer |
79 | * @offset: offset in skb |
80 | * @len: skb->len - offset |
81 | */ |
82 | static int iscsi_sw_tcp_recv(read_descriptor_t *rd_desc, struct sk_buff *skb, |
83 | unsigned int offset, size_t len) |
84 | { |
85 | struct iscsi_conn *conn = rd_desc->arg.data; |
86 | unsigned int consumed, total_consumed = 0; |
87 | int status; |
88 | |
89 | ISCSI_SW_TCP_DBG(conn, "in %d bytes\n", skb->len - offset); |
90 | |
91 | do { |
92 | status = 0; |
93 | consumed = iscsi_tcp_recv_skb(conn, skb, offset, 0, &status); |
94 | offset += consumed; |
95 | total_consumed += consumed; |
96 | } while (consumed != 0 && status != ISCSI_TCP_SKB_DONE); |
97 | |
98 | ISCSI_SW_TCP_DBG(conn, "read %d bytes status %d\n", |
99 | skb->len - offset, status); |
100 | return total_consumed; |
101 | } |
102 | |
103 | /** |
104 | * iscsi_sw_sk_state_check - check socket state |
105 | * @sk: socket |
106 | * |
107 | * If the socket is in CLOSE or CLOSE_WAIT we should |
108 | * not close the connection if there is still some |
109 | * data pending. |
110 | */ |
111 | static inline int iscsi_sw_sk_state_check(struct sock *sk) |
112 | { |
113 | struct iscsi_conn *conn = (struct iscsi_conn*)sk->sk_user_data; |
114 | |
115 | if ((sk->sk_state == TCP_CLOSE_WAIT || sk->sk_state == TCP_CLOSE) && |
116 | !atomic_read(&sk->sk_rmem_alloc)) { |
117 | ISCSI_SW_TCP_DBG(conn, "TCP_CLOSE|TCP_CLOSE_WAIT\n"); |
118 | iscsi_conn_failure(conn, ISCSI_ERR_TCP_CONN_CLOSE); |
119 | return -ECONNRESET; |
120 | } |
121 | return 0; |
122 | } |
123 | |
124 | static void iscsi_sw_tcp_data_ready(struct sock *sk, int flag) |
125 | { |
126 | struct iscsi_conn *conn = sk->sk_user_data; |
127 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
128 | read_descriptor_t rd_desc; |
129 | |
130 | read_lock(&sk->sk_callback_lock); |
131 | |
132 | /* |
133 | * Use rd_desc to pass 'conn' to iscsi_tcp_recv. |
134 | * We set count to 1 because we want the network layer to |
135 | * hand us all the skbs that are available. iscsi_tcp_recv |
136 | * handled pdus that cross buffers or pdus that still need data. |
137 | */ |
138 | rd_desc.arg.data = conn; |
139 | rd_desc.count = 1; |
140 | tcp_read_sock(sk, &rd_desc, iscsi_sw_tcp_recv); |
141 | |
142 | iscsi_sw_sk_state_check(sk); |
143 | |
144 | read_unlock(&sk->sk_callback_lock); |
145 | |
146 | /* If we had to (atomically) map a highmem page, |
147 | * unmap it now. */ |
148 | iscsi_tcp_segment_unmap(&tcp_conn->in.segment); |
149 | } |
150 | |
151 | static void iscsi_sw_tcp_state_change(struct sock *sk) |
152 | { |
153 | struct iscsi_tcp_conn *tcp_conn; |
154 | struct iscsi_sw_tcp_conn *tcp_sw_conn; |
155 | struct iscsi_conn *conn; |
156 | struct iscsi_session *session; |
157 | void (*old_state_change)(struct sock *); |
158 | |
159 | read_lock(&sk->sk_callback_lock); |
160 | |
161 | conn = (struct iscsi_conn*)sk->sk_user_data; |
162 | session = conn->session; |
163 | |
164 | iscsi_sw_sk_state_check(sk); |
165 | |
166 | tcp_conn = conn->dd_data; |
167 | tcp_sw_conn = tcp_conn->dd_data; |
168 | old_state_change = tcp_sw_conn->old_state_change; |
169 | |
170 | read_unlock(&sk->sk_callback_lock); |
171 | |
172 | old_state_change(sk); |
173 | } |
174 | |
175 | /** |
176 | * iscsi_write_space - Called when more output buffer space is available |
177 | * @sk: socket space is available for |
178 | **/ |
179 | static void iscsi_sw_tcp_write_space(struct sock *sk) |
180 | { |
181 | struct iscsi_conn *conn = (struct iscsi_conn*)sk->sk_user_data; |
182 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
183 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
184 | |
185 | tcp_sw_conn->old_write_space(sk); |
186 | ISCSI_SW_TCP_DBG(conn, "iscsi_write_space\n"); |
187 | iscsi_conn_queue_work(conn); |
188 | } |
189 | |
190 | static void iscsi_sw_tcp_conn_set_callbacks(struct iscsi_conn *conn) |
191 | { |
192 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
193 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
194 | struct sock *sk = tcp_sw_conn->sock->sk; |
195 | |
196 | /* assign new callbacks */ |
197 | write_lock_bh(&sk->sk_callback_lock); |
198 | sk->sk_user_data = conn; |
199 | tcp_sw_conn->old_data_ready = sk->sk_data_ready; |
200 | tcp_sw_conn->old_state_change = sk->sk_state_change; |
201 | tcp_sw_conn->old_write_space = sk->sk_write_space; |
202 | sk->sk_data_ready = iscsi_sw_tcp_data_ready; |
203 | sk->sk_state_change = iscsi_sw_tcp_state_change; |
204 | sk->sk_write_space = iscsi_sw_tcp_write_space; |
205 | write_unlock_bh(&sk->sk_callback_lock); |
206 | } |
207 | |
208 | static void |
209 | iscsi_sw_tcp_conn_restore_callbacks(struct iscsi_sw_tcp_conn *tcp_sw_conn) |
210 | { |
211 | struct sock *sk = tcp_sw_conn->sock->sk; |
212 | |
213 | /* restore socket callbacks, see also: iscsi_conn_set_callbacks() */ |
214 | write_lock_bh(&sk->sk_callback_lock); |
215 | sk->sk_user_data = NULL; |
216 | sk->sk_data_ready = tcp_sw_conn->old_data_ready; |
217 | sk->sk_state_change = tcp_sw_conn->old_state_change; |
218 | sk->sk_write_space = tcp_sw_conn->old_write_space; |
219 | sk->sk_no_check = 0; |
220 | write_unlock_bh(&sk->sk_callback_lock); |
221 | } |
222 | |
223 | /** |
224 | * iscsi_sw_tcp_xmit_segment - transmit segment |
225 | * @tcp_conn: the iSCSI TCP connection |
226 | * @segment: the buffer to transmnit |
227 | * |
228 | * This function transmits as much of the buffer as |
229 | * the network layer will accept, and returns the number of |
230 | * bytes transmitted. |
231 | * |
232 | * If CRC hashing is enabled, the function will compute the |
233 | * hash as it goes. When the entire segment has been transmitted, |
234 | * it will retrieve the hash value and send it as well. |
235 | */ |
236 | static int iscsi_sw_tcp_xmit_segment(struct iscsi_tcp_conn *tcp_conn, |
237 | struct iscsi_segment *segment) |
238 | { |
239 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
240 | struct socket *sk = tcp_sw_conn->sock; |
241 | unsigned int copied = 0; |
242 | int r = 0; |
243 | |
244 | while (!iscsi_tcp_segment_done(tcp_conn, segment, 0, r)) { |
245 | struct scatterlist *sg; |
246 | unsigned int offset, copy; |
247 | int flags = 0; |
248 | |
249 | r = 0; |
250 | offset = segment->copied; |
251 | copy = segment->size - offset; |
252 | |
253 | if (segment->total_copied + segment->size < segment->total_size) |
254 | flags |= MSG_MORE; |
255 | |
256 | /* Use sendpage if we can; else fall back to sendmsg */ |
257 | if (!segment->data) { |
258 | sg = segment->sg; |
259 | offset += segment->sg_offset + sg->offset; |
260 | r = tcp_sw_conn->sendpage(sk, sg_page(sg), offset, |
261 | copy, flags); |
262 | } else { |
263 | struct msghdr msg = { .msg_flags = flags }; |
264 | struct kvec iov = { |
265 | .iov_base = segment->data + offset, |
266 | .iov_len = copy |
267 | }; |
268 | |
269 | r = kernel_sendmsg(sk, &msg, &iov, 1, copy); |
270 | } |
271 | |
272 | if (r < 0) { |
273 | iscsi_tcp_segment_unmap(segment); |
274 | return r; |
275 | } |
276 | copied += r; |
277 | } |
278 | return copied; |
279 | } |
280 | |
281 | /** |
282 | * iscsi_sw_tcp_xmit - TCP transmit |
283 | **/ |
284 | static int iscsi_sw_tcp_xmit(struct iscsi_conn *conn) |
285 | { |
286 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
287 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
288 | struct iscsi_segment *segment = &tcp_sw_conn->out.segment; |
289 | unsigned int consumed = 0; |
290 | int rc = 0; |
291 | |
292 | while (1) { |
293 | rc = iscsi_sw_tcp_xmit_segment(tcp_conn, segment); |
294 | /* |
295 | * We may not have been able to send data because the conn |
296 | * is getting stopped. libiscsi will know so propogate err |
297 | * for it to do the right thing. |
298 | */ |
299 | if (rc == -EAGAIN) |
300 | return rc; |
301 | else if (rc < 0) { |
302 | rc = ISCSI_ERR_XMIT_FAILED; |
303 | goto error; |
304 | } else if (rc == 0) |
305 | break; |
306 | |
307 | consumed += rc; |
308 | |
309 | if (segment->total_copied >= segment->total_size) { |
310 | if (segment->done != NULL) { |
311 | rc = segment->done(tcp_conn, segment); |
312 | if (rc != 0) |
313 | goto error; |
314 | } |
315 | } |
316 | } |
317 | |
318 | ISCSI_SW_TCP_DBG(conn, "xmit %d bytes\n", consumed); |
319 | |
320 | conn->txdata_octets += consumed; |
321 | return consumed; |
322 | |
323 | error: |
324 | /* Transmit error. We could initiate error recovery |
325 | * here. */ |
326 | ISCSI_SW_TCP_DBG(conn, "Error sending PDU, errno=%d\n", rc); |
327 | iscsi_conn_failure(conn, rc); |
328 | return -EIO; |
329 | } |
330 | |
331 | /** |
332 | * iscsi_tcp_xmit_qlen - return the number of bytes queued for xmit |
333 | */ |
334 | static inline int iscsi_sw_tcp_xmit_qlen(struct iscsi_conn *conn) |
335 | { |
336 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
337 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
338 | struct iscsi_segment *segment = &tcp_sw_conn->out.segment; |
339 | |
340 | return segment->total_copied - segment->total_size; |
341 | } |
342 | |
343 | static int iscsi_sw_tcp_pdu_xmit(struct iscsi_task *task) |
344 | { |
345 | struct iscsi_conn *conn = task->conn; |
346 | int rc; |
347 | |
348 | while (iscsi_sw_tcp_xmit_qlen(conn)) { |
349 | rc = iscsi_sw_tcp_xmit(conn); |
350 | if (rc == 0) |
351 | return -EAGAIN; |
352 | if (rc < 0) |
353 | return rc; |
354 | } |
355 | |
356 | return 0; |
357 | } |
358 | |
359 | /* |
360 | * This is called when we're done sending the header. |
361 | * Simply copy the data_segment to the send segment, and return. |
362 | */ |
363 | static int iscsi_sw_tcp_send_hdr_done(struct iscsi_tcp_conn *tcp_conn, |
364 | struct iscsi_segment *segment) |
365 | { |
366 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
367 | |
368 | tcp_sw_conn->out.segment = tcp_sw_conn->out.data_segment; |
369 | ISCSI_SW_TCP_DBG(tcp_conn->iscsi_conn, |
370 | "Header done. Next segment size %u total_size %u\n", |
371 | tcp_sw_conn->out.segment.size, |
372 | tcp_sw_conn->out.segment.total_size); |
373 | return 0; |
374 | } |
375 | |
376 | static void iscsi_sw_tcp_send_hdr_prep(struct iscsi_conn *conn, void *hdr, |
377 | size_t hdrlen) |
378 | { |
379 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
380 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
381 | |
382 | ISCSI_SW_TCP_DBG(conn, "%s\n", conn->hdrdgst_en ? |
383 | "digest enabled" : "digest disabled"); |
384 | |
385 | /* Clear the data segment - needs to be filled in by the |
386 | * caller using iscsi_tcp_send_data_prep() */ |
387 | memset(&tcp_sw_conn->out.data_segment, 0, |
388 | sizeof(struct iscsi_segment)); |
389 | |
390 | /* If header digest is enabled, compute the CRC and |
391 | * place the digest into the same buffer. We make |
392 | * sure that both iscsi_tcp_task and mtask have |
393 | * sufficient room. |
394 | */ |
395 | if (conn->hdrdgst_en) { |
396 | iscsi_tcp_dgst_header(&tcp_sw_conn->tx_hash, hdr, hdrlen, |
397 | hdr + hdrlen); |
398 | hdrlen += ISCSI_DIGEST_SIZE; |
399 | } |
400 | |
401 | /* Remember header pointer for later, when we need |
402 | * to decide whether there's a payload to go along |
403 | * with the header. */ |
404 | tcp_sw_conn->out.hdr = hdr; |
405 | |
406 | iscsi_segment_init_linear(&tcp_sw_conn->out.segment, hdr, hdrlen, |
407 | iscsi_sw_tcp_send_hdr_done, NULL); |
408 | } |
409 | |
410 | /* |
411 | * Prepare the send buffer for the payload data. |
412 | * Padding and checksumming will all be taken care |
413 | * of by the iscsi_segment routines. |
414 | */ |
415 | static int |
416 | iscsi_sw_tcp_send_data_prep(struct iscsi_conn *conn, struct scatterlist *sg, |
417 | unsigned int count, unsigned int offset, |
418 | unsigned int len) |
419 | { |
420 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
421 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
422 | struct hash_desc *tx_hash = NULL; |
423 | unsigned int hdr_spec_len; |
424 | |
425 | ISCSI_SW_TCP_DBG(conn, "offset=%d, datalen=%d %s\n", offset, len, |
426 | conn->datadgst_en ? |
427 | "digest enabled" : "digest disabled"); |
428 | |
429 | /* Make sure the datalen matches what the caller |
430 | said he would send. */ |
431 | hdr_spec_len = ntoh24(tcp_sw_conn->out.hdr->dlength); |
432 | WARN_ON(iscsi_padded(len) != iscsi_padded(hdr_spec_len)); |
433 | |
434 | if (conn->datadgst_en) |
435 | tx_hash = &tcp_sw_conn->tx_hash; |
436 | |
437 | return iscsi_segment_seek_sg(&tcp_sw_conn->out.data_segment, |
438 | sg, count, offset, len, |
439 | NULL, tx_hash); |
440 | } |
441 | |
442 | static void |
443 | iscsi_sw_tcp_send_linear_data_prep(struct iscsi_conn *conn, void *data, |
444 | size_t len) |
445 | { |
446 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
447 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
448 | struct hash_desc *tx_hash = NULL; |
449 | unsigned int hdr_spec_len; |
450 | |
451 | ISCSI_SW_TCP_DBG(conn, "datalen=%zd %s\n", len, conn->datadgst_en ? |
452 | "digest enabled" : "digest disabled"); |
453 | |
454 | /* Make sure the datalen matches what the caller |
455 | said he would send. */ |
456 | hdr_spec_len = ntoh24(tcp_sw_conn->out.hdr->dlength); |
457 | WARN_ON(iscsi_padded(len) != iscsi_padded(hdr_spec_len)); |
458 | |
459 | if (conn->datadgst_en) |
460 | tx_hash = &tcp_sw_conn->tx_hash; |
461 | |
462 | iscsi_segment_init_linear(&tcp_sw_conn->out.data_segment, |
463 | data, len, NULL, tx_hash); |
464 | } |
465 | |
466 | static int iscsi_sw_tcp_pdu_init(struct iscsi_task *task, |
467 | unsigned int offset, unsigned int count) |
468 | { |
469 | struct iscsi_conn *conn = task->conn; |
470 | int err = 0; |
471 | |
472 | iscsi_sw_tcp_send_hdr_prep(conn, task->hdr, task->hdr_len); |
473 | |
474 | if (!count) |
475 | return 0; |
476 | |
477 | if (!task->sc) |
478 | iscsi_sw_tcp_send_linear_data_prep(conn, task->data, count); |
479 | else { |
480 | struct scsi_data_buffer *sdb = scsi_out(task->sc); |
481 | |
482 | err = iscsi_sw_tcp_send_data_prep(conn, sdb->table.sgl, |
483 | sdb->table.nents, offset, |
484 | count); |
485 | } |
486 | |
487 | if (err) { |
488 | /* got invalid offset/len */ |
489 | return -EIO; |
490 | } |
491 | return 0; |
492 | } |
493 | |
494 | static int iscsi_sw_tcp_pdu_alloc(struct iscsi_task *task, uint8_t opcode) |
495 | { |
496 | struct iscsi_tcp_task *tcp_task = task->dd_data; |
497 | |
498 | task->hdr = task->dd_data + sizeof(*tcp_task); |
499 | task->hdr_max = sizeof(struct iscsi_sw_tcp_hdrbuf) - ISCSI_DIGEST_SIZE; |
500 | return 0; |
501 | } |
502 | |
503 | static struct iscsi_cls_conn * |
504 | iscsi_sw_tcp_conn_create(struct iscsi_cls_session *cls_session, |
505 | uint32_t conn_idx) |
506 | { |
507 | struct iscsi_conn *conn; |
508 | struct iscsi_cls_conn *cls_conn; |
509 | struct iscsi_tcp_conn *tcp_conn; |
510 | struct iscsi_sw_tcp_conn *tcp_sw_conn; |
511 | |
512 | cls_conn = iscsi_tcp_conn_setup(cls_session, sizeof(*tcp_sw_conn), |
513 | conn_idx); |
514 | if (!cls_conn) |
515 | return NULL; |
516 | conn = cls_conn->dd_data; |
517 | tcp_conn = conn->dd_data; |
518 | tcp_sw_conn = tcp_conn->dd_data; |
519 | |
520 | tcp_sw_conn->tx_hash.tfm = crypto_alloc_hash("crc32c", 0, |
521 | CRYPTO_ALG_ASYNC); |
522 | tcp_sw_conn->tx_hash.flags = 0; |
523 | if (IS_ERR(tcp_sw_conn->tx_hash.tfm)) |
524 | goto free_conn; |
525 | |
526 | tcp_sw_conn->rx_hash.tfm = crypto_alloc_hash("crc32c", 0, |
527 | CRYPTO_ALG_ASYNC); |
528 | tcp_sw_conn->rx_hash.flags = 0; |
529 | if (IS_ERR(tcp_sw_conn->rx_hash.tfm)) |
530 | goto free_tx_tfm; |
531 | tcp_conn->rx_hash = &tcp_sw_conn->rx_hash; |
532 | |
533 | return cls_conn; |
534 | |
535 | free_tx_tfm: |
536 | crypto_free_hash(tcp_sw_conn->tx_hash.tfm); |
537 | free_conn: |
538 | iscsi_conn_printk(KERN_ERR, conn, |
539 | "Could not create connection due to crc32c " |
540 | "loading error. Make sure the crc32c " |
541 | "module is built as a module or into the " |
542 | "kernel\n"); |
543 | iscsi_tcp_conn_teardown(cls_conn); |
544 | return NULL; |
545 | } |
546 | |
547 | static void iscsi_sw_tcp_release_conn(struct iscsi_conn *conn) |
548 | { |
549 | struct iscsi_session *session = conn->session; |
550 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
551 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
552 | struct socket *sock = tcp_sw_conn->sock; |
553 | |
554 | if (!sock) |
555 | return; |
556 | |
557 | sock_hold(sock->sk); |
558 | iscsi_sw_tcp_conn_restore_callbacks(tcp_sw_conn); |
559 | sock_put(sock->sk); |
560 | |
561 | spin_lock_bh(&session->lock); |
562 | tcp_sw_conn->sock = NULL; |
563 | spin_unlock_bh(&session->lock); |
564 | sockfd_put(sock); |
565 | } |
566 | |
567 | static void iscsi_sw_tcp_conn_destroy(struct iscsi_cls_conn *cls_conn) |
568 | { |
569 | struct iscsi_conn *conn = cls_conn->dd_data; |
570 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
571 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
572 | |
573 | iscsi_sw_tcp_release_conn(conn); |
574 | |
575 | if (tcp_sw_conn->tx_hash.tfm) |
576 | crypto_free_hash(tcp_sw_conn->tx_hash.tfm); |
577 | if (tcp_sw_conn->rx_hash.tfm) |
578 | crypto_free_hash(tcp_sw_conn->rx_hash.tfm); |
579 | |
580 | iscsi_tcp_conn_teardown(cls_conn); |
581 | } |
582 | |
583 | static void iscsi_sw_tcp_conn_stop(struct iscsi_cls_conn *cls_conn, int flag) |
584 | { |
585 | struct iscsi_conn *conn = cls_conn->dd_data; |
586 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
587 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
588 | struct socket *sock = tcp_sw_conn->sock; |
589 | |
590 | /* userspace may have goofed up and not bound us */ |
591 | if (!sock) |
592 | return; |
593 | /* |
594 | * Make sure our recv side is stopped. |
595 | * Older tools called conn stop before ep_disconnect |
596 | * so IO could still be coming in. |
597 | */ |
598 | write_lock_bh(&tcp_sw_conn->sock->sk->sk_callback_lock); |
599 | set_bit(ISCSI_SUSPEND_BIT, &conn->suspend_rx); |
600 | write_unlock_bh(&tcp_sw_conn->sock->sk->sk_callback_lock); |
601 | |
602 | if (sock->sk->sk_sleep) { |
603 | sock->sk->sk_err = EIO; |
604 | wake_up_interruptible(sock->sk->sk_sleep); |
605 | } |
606 | |
607 | iscsi_conn_stop(cls_conn, flag); |
608 | iscsi_sw_tcp_release_conn(conn); |
609 | } |
610 | |
611 | static int iscsi_sw_tcp_get_addr(struct iscsi_conn *conn, struct socket *sock, |
612 | char *buf, int *port, |
613 | int (*getname)(struct socket *, |
614 | struct sockaddr *, |
615 | int *addrlen)) |
616 | { |
617 | struct sockaddr_storage *addr; |
618 | struct sockaddr_in6 *sin6; |
619 | struct sockaddr_in *sin; |
620 | int rc = 0, len; |
621 | |
622 | addr = kmalloc(sizeof(*addr), GFP_KERNEL); |
623 | if (!addr) |
624 | return -ENOMEM; |
625 | |
626 | if (getname(sock, (struct sockaddr *) addr, &len)) { |
627 | rc = -ENODEV; |
628 | goto free_addr; |
629 | } |
630 | |
631 | switch (addr->ss_family) { |
632 | case AF_INET: |
633 | sin = (struct sockaddr_in *)addr; |
634 | spin_lock_bh(&conn->session->lock); |
635 | sprintf(buf, "%pI4", &sin->sin_addr.s_addr); |
636 | *port = be16_to_cpu(sin->sin_port); |
637 | spin_unlock_bh(&conn->session->lock); |
638 | break; |
639 | case AF_INET6: |
640 | sin6 = (struct sockaddr_in6 *)addr; |
641 | spin_lock_bh(&conn->session->lock); |
642 | sprintf(buf, "%pI6", &sin6->sin6_addr); |
643 | *port = be16_to_cpu(sin6->sin6_port); |
644 | spin_unlock_bh(&conn->session->lock); |
645 | break; |
646 | } |
647 | free_addr: |
648 | kfree(addr); |
649 | return rc; |
650 | } |
651 | |
652 | static int |
653 | iscsi_sw_tcp_conn_bind(struct iscsi_cls_session *cls_session, |
654 | struct iscsi_cls_conn *cls_conn, uint64_t transport_eph, |
655 | int is_leading) |
656 | { |
657 | struct Scsi_Host *shost = iscsi_session_to_shost(cls_session); |
658 | struct iscsi_host *ihost = shost_priv(shost); |
659 | struct iscsi_conn *conn = cls_conn->dd_data; |
660 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
661 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
662 | struct sock *sk; |
663 | struct socket *sock; |
664 | int err; |
665 | |
666 | /* lookup for existing socket */ |
667 | sock = sockfd_lookup((int)transport_eph, &err); |
668 | if (!sock) { |
669 | iscsi_conn_printk(KERN_ERR, conn, |
670 | "sockfd_lookup failed %d\n", err); |
671 | return -EEXIST; |
672 | } |
673 | /* |
674 | * copy these values now because if we drop the session |
675 | * userspace may still want to query the values since we will |
676 | * be using them for the reconnect |
677 | */ |
678 | err = iscsi_sw_tcp_get_addr(conn, sock, conn->portal_address, |
679 | &conn->portal_port, kernel_getpeername); |
680 | if (err) |
681 | goto free_socket; |
682 | |
683 | err = iscsi_sw_tcp_get_addr(conn, sock, ihost->local_address, |
684 | &ihost->local_port, kernel_getsockname); |
685 | if (err) |
686 | goto free_socket; |
687 | |
688 | err = iscsi_conn_bind(cls_session, cls_conn, is_leading); |
689 | if (err) |
690 | goto free_socket; |
691 | |
692 | /* bind iSCSI connection and socket */ |
693 | tcp_sw_conn->sock = sock; |
694 | |
695 | /* setup Socket parameters */ |
696 | sk = sock->sk; |
697 | sk->sk_reuse = 1; |
698 | sk->sk_sndtimeo = 15 * HZ; /* FIXME: make it configurable */ |
699 | sk->sk_allocation = GFP_ATOMIC; |
700 | |
701 | iscsi_sw_tcp_conn_set_callbacks(conn); |
702 | tcp_sw_conn->sendpage = tcp_sw_conn->sock->ops->sendpage; |
703 | /* |
704 | * set receive state machine into initial state |
705 | */ |
706 | iscsi_tcp_hdr_recv_prep(tcp_conn); |
707 | return 0; |
708 | |
709 | free_socket: |
710 | sockfd_put(sock); |
711 | return err; |
712 | } |
713 | |
714 | static int iscsi_sw_tcp_conn_set_param(struct iscsi_cls_conn *cls_conn, |
715 | enum iscsi_param param, char *buf, |
716 | int buflen) |
717 | { |
718 | struct iscsi_conn *conn = cls_conn->dd_data; |
719 | struct iscsi_session *session = conn->session; |
720 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
721 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
722 | int value; |
723 | |
724 | switch(param) { |
725 | case ISCSI_PARAM_HDRDGST_EN: |
726 | iscsi_set_param(cls_conn, param, buf, buflen); |
727 | break; |
728 | case ISCSI_PARAM_DATADGST_EN: |
729 | iscsi_set_param(cls_conn, param, buf, buflen); |
730 | tcp_sw_conn->sendpage = conn->datadgst_en ? |
731 | sock_no_sendpage : tcp_sw_conn->sock->ops->sendpage; |
732 | break; |
733 | case ISCSI_PARAM_MAX_R2T: |
734 | sscanf(buf, "%d", &value); |
735 | if (value <= 0 || !is_power_of_2(value)) |
736 | return -EINVAL; |
737 | if (session->max_r2t == value) |
738 | break; |
739 | iscsi_tcp_r2tpool_free(session); |
740 | iscsi_set_param(cls_conn, param, buf, buflen); |
741 | if (iscsi_tcp_r2tpool_alloc(session)) |
742 | return -ENOMEM; |
743 | break; |
744 | default: |
745 | return iscsi_set_param(cls_conn, param, buf, buflen); |
746 | } |
747 | |
748 | return 0; |
749 | } |
750 | |
751 | static int iscsi_sw_tcp_conn_get_param(struct iscsi_cls_conn *cls_conn, |
752 | enum iscsi_param param, char *buf) |
753 | { |
754 | struct iscsi_conn *conn = cls_conn->dd_data; |
755 | int len; |
756 | |
757 | switch(param) { |
758 | case ISCSI_PARAM_CONN_PORT: |
759 | spin_lock_bh(&conn->session->lock); |
760 | len = sprintf(buf, "%hu\n", conn->portal_port); |
761 | spin_unlock_bh(&conn->session->lock); |
762 | break; |
763 | case ISCSI_PARAM_CONN_ADDRESS: |
764 | spin_lock_bh(&conn->session->lock); |
765 | len = sprintf(buf, "%s\n", conn->portal_address); |
766 | spin_unlock_bh(&conn->session->lock); |
767 | break; |
768 | default: |
769 | return iscsi_conn_get_param(cls_conn, param, buf); |
770 | } |
771 | |
772 | return len; |
773 | } |
774 | |
775 | static void |
776 | iscsi_sw_tcp_conn_get_stats(struct iscsi_cls_conn *cls_conn, |
777 | struct iscsi_stats *stats) |
778 | { |
779 | struct iscsi_conn *conn = cls_conn->dd_data; |
780 | struct iscsi_tcp_conn *tcp_conn = conn->dd_data; |
781 | struct iscsi_sw_tcp_conn *tcp_sw_conn = tcp_conn->dd_data; |
782 | |
783 | stats->custom_length = 3; |
784 | strcpy(stats->custom[0].desc, "tx_sendpage_failures"); |
785 | stats->custom[0].value = tcp_sw_conn->sendpage_failures_cnt; |
786 | strcpy(stats->custom[1].desc, "rx_discontiguous_hdr"); |
787 | stats->custom[1].value = tcp_sw_conn->discontiguous_hdr_cnt; |
788 | strcpy(stats->custom[2].desc, "eh_abort_cnt"); |
789 | stats->custom[2].value = conn->eh_abort_cnt; |
790 | |
791 | iscsi_tcp_conn_get_stats(cls_conn, stats); |
792 | } |
793 | |
794 | static struct iscsi_cls_session * |
795 | iscsi_sw_tcp_session_create(struct iscsi_endpoint *ep, uint16_t cmds_max, |
796 | uint16_t qdepth, uint32_t initial_cmdsn) |
797 | { |
798 | struct iscsi_cls_session *cls_session; |
799 | struct iscsi_session *session; |
800 | struct Scsi_Host *shost; |
801 | |
802 | if (ep) { |
803 | printk(KERN_ERR "iscsi_tcp: invalid ep %p.\n", ep); |
804 | return NULL; |
805 | } |
806 | |
807 | shost = iscsi_host_alloc(&iscsi_sw_tcp_sht, 0, 1); |
808 | if (!shost) |
809 | return NULL; |
810 | shost->transportt = iscsi_sw_tcp_scsi_transport; |
811 | shost->cmd_per_lun = qdepth; |
812 | shost->max_lun = iscsi_max_lun; |
813 | shost->max_id = 0; |
814 | shost->max_channel = 0; |
815 | shost->max_cmd_len = SCSI_MAX_VARLEN_CDB_SIZE; |
816 | |
817 | if (iscsi_host_add(shost, NULL)) |
818 | goto free_host; |
819 | |
820 | cls_session = iscsi_session_setup(&iscsi_sw_tcp_transport, shost, |
821 | cmds_max, 0, |
822 | sizeof(struct iscsi_tcp_task) + |
823 | sizeof(struct iscsi_sw_tcp_hdrbuf), |
824 | initial_cmdsn, 0); |
825 | if (!cls_session) |
826 | goto remove_host; |
827 | session = cls_session->dd_data; |
828 | |
829 | shost->can_queue = session->scsi_cmds_max; |
830 | if (iscsi_tcp_r2tpool_alloc(session)) |
831 | goto remove_session; |
832 | return cls_session; |
833 | |
834 | remove_session: |
835 | iscsi_session_teardown(cls_session); |
836 | remove_host: |
837 | iscsi_host_remove(shost); |
838 | free_host: |
839 | iscsi_host_free(shost); |
840 | return NULL; |
841 | } |
842 | |
843 | static void iscsi_sw_tcp_session_destroy(struct iscsi_cls_session *cls_session) |
844 | { |
845 | struct Scsi_Host *shost = iscsi_session_to_shost(cls_session); |
846 | |
847 | iscsi_tcp_r2tpool_free(cls_session->dd_data); |
848 | iscsi_session_teardown(cls_session); |
849 | |
850 | iscsi_host_remove(shost); |
851 | iscsi_host_free(shost); |
852 | } |
853 | |
854 | static int iscsi_sw_tcp_slave_alloc(struct scsi_device *sdev) |
855 | { |
856 | set_bit(QUEUE_FLAG_BIDI, &sdev->request_queue->queue_flags); |
857 | return 0; |
858 | } |
859 | |
860 | static int iscsi_sw_tcp_slave_configure(struct scsi_device *sdev) |
861 | { |
862 | blk_queue_bounce_limit(sdev->request_queue, BLK_BOUNCE_ANY); |
863 | blk_queue_dma_alignment(sdev->request_queue, 0); |
864 | return 0; |
865 | } |
866 | |
867 | static struct scsi_host_template iscsi_sw_tcp_sht = { |
868 | .module = THIS_MODULE, |
869 | .name = "iSCSI Initiator over TCP/IP", |
870 | .queuecommand = iscsi_queuecommand, |
871 | .change_queue_depth = iscsi_change_queue_depth, |
872 | .can_queue = ISCSI_DEF_XMIT_CMDS_MAX - 1, |
873 | .sg_tablesize = 4096, |
874 | .max_sectors = 0xFFFF, |
875 | .cmd_per_lun = ISCSI_DEF_CMD_PER_LUN, |
876 | .eh_abort_handler = iscsi_eh_abort, |
877 | .eh_device_reset_handler= iscsi_eh_device_reset, |
878 | .eh_target_reset_handler = iscsi_eh_recover_target, |
879 | .use_clustering = DISABLE_CLUSTERING, |
880 | .slave_alloc = iscsi_sw_tcp_slave_alloc, |
881 | .slave_configure = iscsi_sw_tcp_slave_configure, |
882 | .target_alloc = iscsi_target_alloc, |
883 | .proc_name = "iscsi_tcp", |
884 | .this_id = -1, |
885 | }; |
886 | |
887 | static struct iscsi_transport iscsi_sw_tcp_transport = { |
888 | .owner = THIS_MODULE, |
889 | .name = "tcp", |
890 | .caps = CAP_RECOVERY_L0 | CAP_MULTI_R2T | CAP_HDRDGST |
891 | | CAP_DATADGST, |
892 | .param_mask = ISCSI_MAX_RECV_DLENGTH | |
893 | ISCSI_MAX_XMIT_DLENGTH | |
894 | ISCSI_HDRDGST_EN | |
895 | ISCSI_DATADGST_EN | |
896 | ISCSI_INITIAL_R2T_EN | |
897 | ISCSI_MAX_R2T | |
898 | ISCSI_IMM_DATA_EN | |
899 | ISCSI_FIRST_BURST | |
900 | ISCSI_MAX_BURST | |
901 | ISCSI_PDU_INORDER_EN | |
902 | ISCSI_DATASEQ_INORDER_EN | |
903 | ISCSI_ERL | |
904 | ISCSI_CONN_PORT | |
905 | ISCSI_CONN_ADDRESS | |
906 | ISCSI_EXP_STATSN | |
907 | ISCSI_PERSISTENT_PORT | |
908 | ISCSI_PERSISTENT_ADDRESS | |
909 | ISCSI_TARGET_NAME | ISCSI_TPGT | |
910 | ISCSI_USERNAME | ISCSI_PASSWORD | |
911 | ISCSI_USERNAME_IN | ISCSI_PASSWORD_IN | |
912 | ISCSI_FAST_ABORT | ISCSI_ABORT_TMO | |
913 | ISCSI_LU_RESET_TMO | ISCSI_TGT_RESET_TMO | |
914 | ISCSI_PING_TMO | ISCSI_RECV_TMO | |
915 | ISCSI_IFACE_NAME | ISCSI_INITIATOR_NAME, |
916 | .host_param_mask = ISCSI_HOST_HWADDRESS | ISCSI_HOST_IPADDRESS | |
917 | ISCSI_HOST_INITIATOR_NAME | |
918 | ISCSI_HOST_NETDEV_NAME, |
919 | /* session management */ |
920 | .create_session = iscsi_sw_tcp_session_create, |
921 | .destroy_session = iscsi_sw_tcp_session_destroy, |
922 | /* connection management */ |
923 | .create_conn = iscsi_sw_tcp_conn_create, |
924 | .bind_conn = iscsi_sw_tcp_conn_bind, |
925 | .destroy_conn = iscsi_sw_tcp_conn_destroy, |
926 | .set_param = iscsi_sw_tcp_conn_set_param, |
927 | .get_conn_param = iscsi_sw_tcp_conn_get_param, |
928 | .get_session_param = iscsi_session_get_param, |
929 | .start_conn = iscsi_conn_start, |
930 | .stop_conn = iscsi_sw_tcp_conn_stop, |
931 | /* iscsi host params */ |
932 | .get_host_param = iscsi_host_get_param, |
933 | .set_host_param = iscsi_host_set_param, |
934 | /* IO */ |
935 | .send_pdu = iscsi_conn_send_pdu, |
936 | .get_stats = iscsi_sw_tcp_conn_get_stats, |
937 | /* iscsi task/cmd helpers */ |
938 | .init_task = iscsi_tcp_task_init, |
939 | .xmit_task = iscsi_tcp_task_xmit, |
940 | .cleanup_task = iscsi_tcp_cleanup_task, |
941 | /* low level pdu helpers */ |
942 | .xmit_pdu = iscsi_sw_tcp_pdu_xmit, |
943 | .init_pdu = iscsi_sw_tcp_pdu_init, |
944 | .alloc_pdu = iscsi_sw_tcp_pdu_alloc, |
945 | /* recovery */ |
946 | .session_recovery_timedout = iscsi_session_recovery_timedout, |
947 | }; |
948 | |
949 | static int __init iscsi_sw_tcp_init(void) |
950 | { |
951 | if (iscsi_max_lun < 1) { |
952 | printk(KERN_ERR "iscsi_tcp: Invalid max_lun value of %u\n", |
953 | iscsi_max_lun); |
954 | return -EINVAL; |
955 | } |
956 | |
957 | iscsi_sw_tcp_scsi_transport = iscsi_register_transport( |
958 | &iscsi_sw_tcp_transport); |
959 | if (!iscsi_sw_tcp_scsi_transport) |
960 | return -ENODEV; |
961 | |
962 | return 0; |
963 | } |
964 | |
965 | static void __exit iscsi_sw_tcp_exit(void) |
966 | { |
967 | iscsi_unregister_transport(&iscsi_sw_tcp_transport); |
968 | } |
969 | |
/* Module entry and exit points. */
module_init(iscsi_sw_tcp_init);
module_exit(iscsi_sw_tcp_exit);
972 |
Branches:
ben-wpan
ben-wpan-stefan
javiroman/ks7010
jz-2.6.34
jz-2.6.34-rc5
jz-2.6.34-rc6
jz-2.6.34-rc7
jz-2.6.35
jz-2.6.36
jz-2.6.37
jz-2.6.38
jz-2.6.39
jz-3.0
jz-3.1
jz-3.11
jz-3.12
jz-3.13
jz-3.15
jz-3.16
jz-3.18-dt
jz-3.2
jz-3.3
jz-3.4
jz-3.5
jz-3.6
jz-3.6-rc2-pwm
jz-3.9
jz-3.9-clk
jz-3.9-rc8
jz47xx
jz47xx-2.6.38
master
Tags:
od-2011-09-04
od-2011-09-18
v2.6.34-rc5
v2.6.34-rc6
v2.6.34-rc7
v3.9