2 * Copyright (c) 2006 - 2009 Mellanox Technology Inc. All rights reserved.
3 * Copyright (C) 2008 - 2011 Bart Van Assche <bvanassche@acm.org>.
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
35 #include <linux/module.h>
36 #include <linux/init.h>
37 #include <linux/slab.h>
38 #include <linux/err.h>
39 #include <linux/ctype.h>
40 #include <linux/kthread.h>
41 #include <linux/string.h>
42 #include <linux/delay.h>
43 #include <linux/atomic.h>
44 #include <scsi/scsi_tcq.h>
45 #include <target/configfs_macros.h>
46 #include <target/target_core_base.h>
47 #include <target/target_core_fabric_configfs.h>
48 #include <target/target_core_fabric.h>
49 #include <target/target_core_configfs.h>
52 /* Name of this kernel module. */
53 #define DRV_NAME "ib_srpt"
54 #define DRV_VERSION "2.0.0"
55 #define DRV_RELDATE "2011-02-14"
57 #define SRPT_ID_STRING "Linux SRP target"
60 #define pr_fmt(fmt) DRV_NAME " " fmt
62 MODULE_AUTHOR("Vu Pham and Bart Van Assche");
63 MODULE_DESCRIPTION("InfiniBand SCSI RDMA Protocol target "
64 "v" DRV_VERSION
" (" DRV_RELDATE
")");
65 MODULE_LICENSE("Dual BSD/GPL");
71 static u64 srpt_service_guid
;
72 static DEFINE_SPINLOCK(srpt_dev_lock
); /* Protects srpt_dev_list. */
73 static LIST_HEAD(srpt_dev_list
); /* List of srpt_device structures. */
75 static unsigned srp_max_req_size
= DEFAULT_MAX_REQ_SIZE
;
76 module_param(srp_max_req_size
, int, 0444);
77 MODULE_PARM_DESC(srp_max_req_size
,
78 "Maximum size of SRP request messages in bytes.");
80 static int srpt_srq_size
= DEFAULT_SRPT_SRQ_SIZE
;
81 module_param(srpt_srq_size
, int, 0444);
82 MODULE_PARM_DESC(srpt_srq_size
,
83 "Shared receive queue (SRQ) size.");
85 static int srpt_get_u64_x(char *buffer
, struct kernel_param
*kp
)
87 return sprintf(buffer
, "0x%016llx", *(u64
*)kp
->arg
);
89 module_param_call(srpt_service_guid
, NULL
, srpt_get_u64_x
, &srpt_service_guid
,
91 MODULE_PARM_DESC(srpt_service_guid
,
92 "Using this value for ioc_guid, id_ext, and cm_listen_id"
93 " instead of using the node_guid of the first HCA.");
95 static struct ib_client srpt_client
;
96 static struct target_fabric_configfs
*srpt_target
;
97 static void srpt_release_channel(struct srpt_rdma_ch
*ch
);
98 static int srpt_queue_status(struct se_cmd
*cmd
);
101 * opposite_dma_dir() - Swap DMA_TO_DEVICE and DMA_FROM_DEVICE.
104 enum dma_data_direction
opposite_dma_dir(enum dma_data_direction dir
)
107 case DMA_TO_DEVICE
: return DMA_FROM_DEVICE
;
108 case DMA_FROM_DEVICE
: return DMA_TO_DEVICE
;
114 * srpt_sdev_name() - Return the name associated with the HCA.
116 * Examples are ib0, ib1, ...
118 static inline const char *srpt_sdev_name(struct srpt_device
*sdev
)
120 return sdev
->device
->name
;
123 static enum rdma_ch_state
srpt_get_ch_state(struct srpt_rdma_ch
*ch
)
126 enum rdma_ch_state state
;
128 spin_lock_irqsave(&ch
->spinlock
, flags
);
130 spin_unlock_irqrestore(&ch
->spinlock
, flags
);
134 static enum rdma_ch_state
135 srpt_set_ch_state(struct srpt_rdma_ch
*ch
, enum rdma_ch_state new_state
)
138 enum rdma_ch_state prev
;
140 spin_lock_irqsave(&ch
->spinlock
, flags
);
142 ch
->state
= new_state
;
143 spin_unlock_irqrestore(&ch
->spinlock
, flags
);
148 * srpt_test_and_set_ch_state() - Test and set the channel state.
150 * Returns true if and only if the channel state has been set to the new state.
153 srpt_test_and_set_ch_state(struct srpt_rdma_ch
*ch
, enum rdma_ch_state old
,
154 enum rdma_ch_state
new)
157 enum rdma_ch_state prev
;
159 spin_lock_irqsave(&ch
->spinlock
, flags
);
163 spin_unlock_irqrestore(&ch
->spinlock
, flags
);
168 * srpt_event_handler() - Asynchronous IB event callback function.
170 * Callback function called by the InfiniBand core when an asynchronous IB
171 * event occurs. This callback may occur in interrupt context. See also
172 * section 11.5.2, Set Asynchronous Event Handler in the InfiniBand
173 * Architecture Specification.
175 static void srpt_event_handler(struct ib_event_handler
*handler
,
176 struct ib_event
*event
)
178 struct srpt_device
*sdev
;
179 struct srpt_port
*sport
;
181 sdev
= ib_get_client_data(event
->device
, &srpt_client
);
182 if (!sdev
|| sdev
->device
!= event
->device
)
185 pr_debug("ASYNC event= %d on device= %s\n", event
->event
,
186 srpt_sdev_name(sdev
));
188 switch (event
->event
) {
189 case IB_EVENT_PORT_ERR
:
190 if (event
->element
.port_num
<= sdev
->device
->phys_port_cnt
) {
191 sport
= &sdev
->port
[event
->element
.port_num
- 1];
196 case IB_EVENT_PORT_ACTIVE
:
197 case IB_EVENT_LID_CHANGE
:
198 case IB_EVENT_PKEY_CHANGE
:
199 case IB_EVENT_SM_CHANGE
:
200 case IB_EVENT_CLIENT_REREGISTER
:
201 /* Refresh port data asynchronously. */
202 if (event
->element
.port_num
<= sdev
->device
->phys_port_cnt
) {
203 sport
= &sdev
->port
[event
->element
.port_num
- 1];
204 if (!sport
->lid
&& !sport
->sm_lid
)
205 schedule_work(&sport
->work
);
209 printk(KERN_ERR
"received unrecognized IB event %d\n",
216 * srpt_srq_event() - SRQ event callback function.
218 static void srpt_srq_event(struct ib_event
*event
, void *ctx
)
220 printk(KERN_INFO
"SRQ event %d\n", event
->event
);
224 * srpt_qp_event() - QP event callback function.
226 static void srpt_qp_event(struct ib_event
*event
, struct srpt_rdma_ch
*ch
)
228 pr_debug("QP event %d on cm_id=%p sess_name=%s state=%d\n",
229 event
->event
, ch
->cm_id
, ch
->sess_name
, srpt_get_ch_state(ch
));
231 switch (event
->event
) {
232 case IB_EVENT_COMM_EST
:
233 ib_cm_notify(ch
->cm_id
, event
->event
);
235 case IB_EVENT_QP_LAST_WQE_REACHED
:
236 if (srpt_test_and_set_ch_state(ch
, CH_DRAINING
,
238 srpt_release_channel(ch
);
240 pr_debug("%s: state %d - ignored LAST_WQE.\n",
241 ch
->sess_name
, srpt_get_ch_state(ch
));
244 printk(KERN_ERR
"received unrecognized IB QP event %d\n",
251 * srpt_set_ioc() - Helper function for initializing an IOUnitInfo structure.
253 * @slot: one-based slot number.
254 * @value: four-bit value.
256 * Copies the lowest four bits of value in element slot of the array of four
257 * bit elements called c_list (controller list). The index slot is one-based.
259 static void srpt_set_ioc(u8
*c_list
, u32 slot
, u8 value
)
266 tmp
= c_list
[id
] & 0xf;
267 c_list
[id
] = (value
<< 4) | tmp
;
269 tmp
= c_list
[id
] & 0xf0;
270 c_list
[id
] = (value
& 0xf) | tmp
;
275 * srpt_get_class_port_info() - Copy ClassPortInfo to a management datagram.
277 * See also section 16.3.3.1 ClassPortInfo in the InfiniBand Architecture
280 static void srpt_get_class_port_info(struct ib_dm_mad
*mad
)
282 struct ib_class_port_info
*cif
;
284 cif
= (struct ib_class_port_info
*)mad
->data
;
285 memset(cif
, 0, sizeof *cif
);
286 cif
->base_version
= 1;
287 cif
->class_version
= 1;
288 cif
->resp_time_value
= 20;
290 mad
->mad_hdr
.status
= 0;
294 * srpt_get_iou() - Write IOUnitInfo to a management datagram.
296 * See also section 16.3.3.3 IOUnitInfo in the InfiniBand Architecture
297 * Specification. See also section B.7, table B.6 in the SRP r16a document.
299 static void srpt_get_iou(struct ib_dm_mad
*mad
)
301 struct ib_dm_iou_info
*ioui
;
305 ioui
= (struct ib_dm_iou_info
*)mad
->data
;
306 ioui
->change_id
= __constant_cpu_to_be16(1);
307 ioui
->max_controllers
= 16;
309 /* set present for slot 1 and empty for the rest */
310 srpt_set_ioc(ioui
->controller_list
, 1, 1);
311 for (i
= 1, slot
= 2; i
< 16; i
++, slot
++)
312 srpt_set_ioc(ioui
->controller_list
, slot
, 0);
314 mad
->mad_hdr
.status
= 0;
318 * srpt_get_ioc() - Write IOControllerprofile to a management datagram.
320 * See also section 16.3.3.4 IOControllerProfile in the InfiniBand
321 * Architecture Specification. See also section B.7, table B.7 in the SRP
324 static void srpt_get_ioc(struct srpt_port
*sport
, u32 slot
,
325 struct ib_dm_mad
*mad
)
327 struct srpt_device
*sdev
= sport
->sdev
;
328 struct ib_dm_ioc_profile
*iocp
;
330 iocp
= (struct ib_dm_ioc_profile
*)mad
->data
;
332 if (!slot
|| slot
> 16) {
334 = __constant_cpu_to_be16(DM_MAD_STATUS_INVALID_FIELD
);
340 = __constant_cpu_to_be16(DM_MAD_STATUS_NO_IOC
);
344 memset(iocp
, 0, sizeof *iocp
);
345 strcpy(iocp
->id_string
, SRPT_ID_STRING
);
346 iocp
->guid
= cpu_to_be64(srpt_service_guid
);
347 iocp
->vendor_id
= cpu_to_be32(sdev
->dev_attr
.vendor_id
);
348 iocp
->device_id
= cpu_to_be32(sdev
->dev_attr
.vendor_part_id
);
349 iocp
->device_version
= cpu_to_be16(sdev
->dev_attr
.hw_ver
);
350 iocp
->subsys_vendor_id
= cpu_to_be32(sdev
->dev_attr
.vendor_id
);
351 iocp
->subsys_device_id
= 0x0;
352 iocp
->io_class
= __constant_cpu_to_be16(SRP_REV16A_IB_IO_CLASS
);
353 iocp
->io_subclass
= __constant_cpu_to_be16(SRP_IO_SUBCLASS
);
354 iocp
->protocol
= __constant_cpu_to_be16(SRP_PROTOCOL
);
355 iocp
->protocol_version
= __constant_cpu_to_be16(SRP_PROTOCOL_VERSION
);
356 iocp
->send_queue_depth
= cpu_to_be16(sdev
->srq_size
);
357 iocp
->rdma_read_depth
= 4;
358 iocp
->send_size
= cpu_to_be32(srp_max_req_size
);
359 iocp
->rdma_size
= cpu_to_be32(min(sport
->port_attrib
.srp_max_rdma_size
,
361 iocp
->num_svc_entries
= 1;
362 iocp
->op_cap_mask
= SRP_SEND_TO_IOC
| SRP_SEND_FROM_IOC
|
363 SRP_RDMA_READ_FROM_IOC
| SRP_RDMA_WRITE_FROM_IOC
;
365 mad
->mad_hdr
.status
= 0;
369 * srpt_get_svc_entries() - Write ServiceEntries to a management datagram.
371 * See also section 16.3.3.5 ServiceEntries in the InfiniBand Architecture
372 * Specification. See also section B.7, table B.8 in the SRP r16a document.
374 static void srpt_get_svc_entries(u64 ioc_guid
,
375 u16 slot
, u8 hi
, u8 lo
, struct ib_dm_mad
*mad
)
377 struct ib_dm_svc_entries
*svc_entries
;
381 if (!slot
|| slot
> 16) {
383 = __constant_cpu_to_be16(DM_MAD_STATUS_INVALID_FIELD
);
387 if (slot
> 2 || lo
> hi
|| hi
> 1) {
389 = __constant_cpu_to_be16(DM_MAD_STATUS_NO_IOC
);
393 svc_entries
= (struct ib_dm_svc_entries
*)mad
->data
;
394 memset(svc_entries
, 0, sizeof *svc_entries
);
395 svc_entries
->service_entries
[0].id
= cpu_to_be64(ioc_guid
);
396 snprintf(svc_entries
->service_entries
[0].name
,
397 sizeof(svc_entries
->service_entries
[0].name
),
399 SRP_SERVICE_NAME_PREFIX
,
402 mad
->mad_hdr
.status
= 0;
406 * srpt_mgmt_method_get() - Process a received management datagram.
407 * @sp: source port through which the MAD has been received.
408 * @rq_mad: received MAD.
409 * @rsp_mad: response MAD.
411 static void srpt_mgmt_method_get(struct srpt_port
*sp
, struct ib_mad
*rq_mad
,
412 struct ib_dm_mad
*rsp_mad
)
418 attr_id
= be16_to_cpu(rq_mad
->mad_hdr
.attr_id
);
420 case DM_ATTR_CLASS_PORT_INFO
:
421 srpt_get_class_port_info(rsp_mad
);
423 case DM_ATTR_IOU_INFO
:
424 srpt_get_iou(rsp_mad
);
426 case DM_ATTR_IOC_PROFILE
:
427 slot
= be32_to_cpu(rq_mad
->mad_hdr
.attr_mod
);
428 srpt_get_ioc(sp
, slot
, rsp_mad
);
430 case DM_ATTR_SVC_ENTRIES
:
431 slot
= be32_to_cpu(rq_mad
->mad_hdr
.attr_mod
);
432 hi
= (u8
) ((slot
>> 8) & 0xff);
433 lo
= (u8
) (slot
& 0xff);
434 slot
= (u16
) ((slot
>> 16) & 0xffff);
435 srpt_get_svc_entries(srpt_service_guid
,
436 slot
, hi
, lo
, rsp_mad
);
439 rsp_mad
->mad_hdr
.status
=
440 __constant_cpu_to_be16(DM_MAD_STATUS_UNSUP_METHOD_ATTR
);
446 * srpt_mad_send_handler() - Post MAD-send callback function.
448 static void srpt_mad_send_handler(struct ib_mad_agent
*mad_agent
,
449 struct ib_mad_send_wc
*mad_wc
)
451 ib_destroy_ah(mad_wc
->send_buf
->ah
);
452 ib_free_send_mad(mad_wc
->send_buf
);
456 * srpt_mad_recv_handler() - MAD reception callback function.
458 static void srpt_mad_recv_handler(struct ib_mad_agent
*mad_agent
,
459 struct ib_mad_recv_wc
*mad_wc
)
461 struct srpt_port
*sport
= (struct srpt_port
*)mad_agent
->context
;
463 struct ib_mad_send_buf
*rsp
;
464 struct ib_dm_mad
*dm_mad
;
466 if (!mad_wc
|| !mad_wc
->recv_buf
.mad
)
469 ah
= ib_create_ah_from_wc(mad_agent
->qp
->pd
, mad_wc
->wc
,
470 mad_wc
->recv_buf
.grh
, mad_agent
->port_num
);
474 BUILD_BUG_ON(offsetof(struct ib_dm_mad
, data
) != IB_MGMT_DEVICE_HDR
);
476 rsp
= ib_create_send_mad(mad_agent
, mad_wc
->wc
->src_qp
,
477 mad_wc
->wc
->pkey_index
, 0,
478 IB_MGMT_DEVICE_HDR
, IB_MGMT_DEVICE_DATA
,
486 memcpy(dm_mad
, mad_wc
->recv_buf
.mad
, sizeof *dm_mad
);
487 dm_mad
->mad_hdr
.method
= IB_MGMT_METHOD_GET_RESP
;
488 dm_mad
->mad_hdr
.status
= 0;
490 switch (mad_wc
->recv_buf
.mad
->mad_hdr
.method
) {
491 case IB_MGMT_METHOD_GET
:
492 srpt_mgmt_method_get(sport
, mad_wc
->recv_buf
.mad
, dm_mad
);
494 case IB_MGMT_METHOD_SET
:
495 dm_mad
->mad_hdr
.status
=
496 __constant_cpu_to_be16(DM_MAD_STATUS_UNSUP_METHOD_ATTR
);
499 dm_mad
->mad_hdr
.status
=
500 __constant_cpu_to_be16(DM_MAD_STATUS_UNSUP_METHOD
);
504 if (!ib_post_send_mad(rsp
, NULL
)) {
505 ib_free_recv_mad(mad_wc
);
506 /* will destroy_ah & free_send_mad in send completion */
510 ib_free_send_mad(rsp
);
515 ib_free_recv_mad(mad_wc
);
519 * srpt_refresh_port() - Configure a HCA port.
521 * Enable InfiniBand management datagram processing, update the cached sm_lid,
522 * lid and gid values, and register a callback function for processing MADs
523 * on the specified port.
525 * Note: It is safe to call this function more than once for the same port.
527 static int srpt_refresh_port(struct srpt_port
*sport
)
529 struct ib_mad_reg_req reg_req
;
530 struct ib_port_modify port_modify
;
531 struct ib_port_attr port_attr
;
534 memset(&port_modify
, 0, sizeof port_modify
);
535 port_modify
.set_port_cap_mask
= IB_PORT_DEVICE_MGMT_SUP
;
536 port_modify
.clr_port_cap_mask
= 0;
538 ret
= ib_modify_port(sport
->sdev
->device
, sport
->port
, 0, &port_modify
);
542 ret
= ib_query_port(sport
->sdev
->device
, sport
->port
, &port_attr
);
546 sport
->sm_lid
= port_attr
.sm_lid
;
547 sport
->lid
= port_attr
.lid
;
549 ret
= ib_query_gid(sport
->sdev
->device
, sport
->port
, 0, &sport
->gid
);
553 if (!sport
->mad_agent
) {
554 memset(®_req
, 0, sizeof reg_req
);
555 reg_req
.mgmt_class
= IB_MGMT_CLASS_DEVICE_MGMT
;
556 reg_req
.mgmt_class_version
= IB_MGMT_BASE_VERSION
;
557 set_bit(IB_MGMT_METHOD_GET
, reg_req
.method_mask
);
558 set_bit(IB_MGMT_METHOD_SET
, reg_req
.method_mask
);
560 sport
->mad_agent
= ib_register_mad_agent(sport
->sdev
->device
,
564 srpt_mad_send_handler
,
565 srpt_mad_recv_handler
,
567 if (IS_ERR(sport
->mad_agent
)) {
568 ret
= PTR_ERR(sport
->mad_agent
);
569 sport
->mad_agent
= NULL
;
578 port_modify
.set_port_cap_mask
= 0;
579 port_modify
.clr_port_cap_mask
= IB_PORT_DEVICE_MGMT_SUP
;
580 ib_modify_port(sport
->sdev
->device
, sport
->port
, 0, &port_modify
);
588 * srpt_unregister_mad_agent() - Unregister MAD callback functions.
590 * Note: It is safe to call this function more than once for the same device.
592 static void srpt_unregister_mad_agent(struct srpt_device
*sdev
)
594 struct ib_port_modify port_modify
= {
595 .clr_port_cap_mask
= IB_PORT_DEVICE_MGMT_SUP
,
597 struct srpt_port
*sport
;
600 for (i
= 1; i
<= sdev
->device
->phys_port_cnt
; i
++) {
601 sport
= &sdev
->port
[i
- 1];
602 WARN_ON(sport
->port
!= i
);
603 if (ib_modify_port(sdev
->device
, i
, 0, &port_modify
) < 0)
604 printk(KERN_ERR
"disabling MAD processing failed.\n");
605 if (sport
->mad_agent
) {
606 ib_unregister_mad_agent(sport
->mad_agent
);
607 sport
->mad_agent
= NULL
;
613 * srpt_alloc_ioctx() - Allocate an SRPT I/O context structure.
615 static struct srpt_ioctx
*srpt_alloc_ioctx(struct srpt_device
*sdev
,
616 int ioctx_size
, int dma_size
,
617 enum dma_data_direction dir
)
619 struct srpt_ioctx
*ioctx
;
621 ioctx
= kmalloc(ioctx_size
, GFP_KERNEL
);
625 ioctx
->buf
= kmalloc(dma_size
, GFP_KERNEL
);
629 ioctx
->dma
= ib_dma_map_single(sdev
->device
, ioctx
->buf
, dma_size
, dir
);
630 if (ib_dma_mapping_error(sdev
->device
, ioctx
->dma
))
644 * srpt_free_ioctx() - Free an SRPT I/O context structure.
646 static void srpt_free_ioctx(struct srpt_device
*sdev
, struct srpt_ioctx
*ioctx
,
647 int dma_size
, enum dma_data_direction dir
)
652 ib_dma_unmap_single(sdev
->device
, ioctx
->dma
, dma_size
, dir
);
658 * srpt_alloc_ioctx_ring() - Allocate a ring of SRPT I/O context structures.
659 * @sdev: Device to allocate the I/O context ring for.
660 * @ring_size: Number of elements in the I/O context ring.
661 * @ioctx_size: I/O context size.
662 * @dma_size: DMA buffer size.
663 * @dir: DMA data direction.
665 static struct srpt_ioctx
**srpt_alloc_ioctx_ring(struct srpt_device
*sdev
,
666 int ring_size
, int ioctx_size
,
667 int dma_size
, enum dma_data_direction dir
)
669 struct srpt_ioctx
**ring
;
672 WARN_ON(ioctx_size
!= sizeof(struct srpt_recv_ioctx
)
673 && ioctx_size
!= sizeof(struct srpt_send_ioctx
));
675 ring
= kmalloc(ring_size
* sizeof(ring
[0]), GFP_KERNEL
);
678 for (i
= 0; i
< ring_size
; ++i
) {
679 ring
[i
] = srpt_alloc_ioctx(sdev
, ioctx_size
, dma_size
, dir
);
688 srpt_free_ioctx(sdev
, ring
[i
], dma_size
, dir
);
696 * srpt_free_ioctx_ring() - Free the ring of SRPT I/O context structures.
698 static void srpt_free_ioctx_ring(struct srpt_ioctx
**ioctx_ring
,
699 struct srpt_device
*sdev
, int ring_size
,
700 int dma_size
, enum dma_data_direction dir
)
704 for (i
= 0; i
< ring_size
; ++i
)
705 srpt_free_ioctx(sdev
, ioctx_ring
[i
], dma_size
, dir
);
710 * srpt_get_cmd_state() - Get the state of a SCSI command.
712 static enum srpt_command_state
srpt_get_cmd_state(struct srpt_send_ioctx
*ioctx
)
714 enum srpt_command_state state
;
719 spin_lock_irqsave(&ioctx
->spinlock
, flags
);
720 state
= ioctx
->state
;
721 spin_unlock_irqrestore(&ioctx
->spinlock
, flags
);
726 * srpt_set_cmd_state() - Set the state of a SCSI command.
728 * Does not modify the state of aborted commands. Returns the previous command
731 static enum srpt_command_state
srpt_set_cmd_state(struct srpt_send_ioctx
*ioctx
,
732 enum srpt_command_state
new)
734 enum srpt_command_state previous
;
739 spin_lock_irqsave(&ioctx
->spinlock
, flags
);
740 previous
= ioctx
->state
;
741 if (previous
!= SRPT_STATE_DONE
)
743 spin_unlock_irqrestore(&ioctx
->spinlock
, flags
);
749 * srpt_test_and_set_cmd_state() - Test and set the state of a command.
751 * Returns true if and only if the previous command state was equal to 'old'.
753 static bool srpt_test_and_set_cmd_state(struct srpt_send_ioctx
*ioctx
,
754 enum srpt_command_state old
,
755 enum srpt_command_state
new)
757 enum srpt_command_state previous
;
761 WARN_ON(old
== SRPT_STATE_DONE
);
762 WARN_ON(new == SRPT_STATE_NEW
);
764 spin_lock_irqsave(&ioctx
->spinlock
, flags
);
765 previous
= ioctx
->state
;
768 spin_unlock_irqrestore(&ioctx
->spinlock
, flags
);
769 return previous
== old
;
773 * srpt_post_recv() - Post an IB receive request.
775 static int srpt_post_recv(struct srpt_device
*sdev
,
776 struct srpt_recv_ioctx
*ioctx
)
779 struct ib_recv_wr wr
, *bad_wr
;
782 wr
.wr_id
= encode_wr_id(SRPT_RECV
, ioctx
->ioctx
.index
);
784 list
.addr
= ioctx
->ioctx
.dma
;
785 list
.length
= srp_max_req_size
;
786 list
.lkey
= sdev
->mr
->lkey
;
792 return ib_post_srq_recv(sdev
->srq
, &wr
, &bad_wr
);
796 * srpt_post_send() - Post an IB send request.
798 * Returns zero upon success and a non-zero value upon failure.
800 static int srpt_post_send(struct srpt_rdma_ch
*ch
,
801 struct srpt_send_ioctx
*ioctx
, int len
)
804 struct ib_send_wr wr
, *bad_wr
;
805 struct srpt_device
*sdev
= ch
->sport
->sdev
;
808 atomic_inc(&ch
->req_lim
);
811 if (unlikely(atomic_dec_return(&ch
->sq_wr_avail
) < 0)) {
812 printk(KERN_WARNING
"IB send queue full (needed 1)\n");
816 ib_dma_sync_single_for_device(sdev
->device
, ioctx
->ioctx
.dma
, len
,
819 list
.addr
= ioctx
->ioctx
.dma
;
821 list
.lkey
= sdev
->mr
->lkey
;
824 wr
.wr_id
= encode_wr_id(SRPT_SEND
, ioctx
->ioctx
.index
);
827 wr
.opcode
= IB_WR_SEND
;
828 wr
.send_flags
= IB_SEND_SIGNALED
;
830 ret
= ib_post_send(ch
->qp
, &wr
, &bad_wr
);
834 atomic_inc(&ch
->sq_wr_avail
);
835 atomic_dec(&ch
->req_lim
);
841 * srpt_get_desc_tbl() - Parse the data descriptors of an SRP_CMD request.
842 * @ioctx: Pointer to the I/O context associated with the request.
843 * @srp_cmd: Pointer to the SRP_CMD request data.
844 * @dir: Pointer to the variable to which the transfer direction will be
846 * @data_len: Pointer to the variable to which the total data length of all
847 * descriptors in the SRP_CMD request will be written.
849 * This function initializes ioctx->nrbuf and ioctx->r_bufs.
851 * Returns -EINVAL when the SRP_CMD request contains inconsistent descriptors;
852 * -ENOMEM when memory allocation fails and zero upon success.
854 static int srpt_get_desc_tbl(struct srpt_send_ioctx
*ioctx
,
855 struct srp_cmd
*srp_cmd
,
856 enum dma_data_direction
*dir
, u64
*data_len
)
858 struct srp_indirect_buf
*idb
;
859 struct srp_direct_buf
*db
;
860 unsigned add_cdb_offset
;
864 * The pointer computations below will only be compiled correctly
865 * if srp_cmd::add_data is declared as s8*, u8*, s8[] or u8[], so check
866 * whether srp_cmd::add_data has been declared as a byte pointer.
868 BUILD_BUG_ON(!__same_type(srp_cmd
->add_data
[0], (s8
)0)
869 && !__same_type(srp_cmd
->add_data
[0], (u8
)0));
878 * The lower four bits of the buffer format field contain the DATA-IN
879 * buffer descriptor format, and the highest four bits contain the
880 * DATA-OUT buffer descriptor format.
883 if (srp_cmd
->buf_fmt
& 0xf)
884 /* DATA-IN: transfer data from target to initiator (read). */
885 *dir
= DMA_FROM_DEVICE
;
886 else if (srp_cmd
->buf_fmt
>> 4)
887 /* DATA-OUT: transfer data from initiator to target (write). */
888 *dir
= DMA_TO_DEVICE
;
891 * According to the SRP spec, the lower two bits of the 'ADDITIONAL
892 * CDB LENGTH' field are reserved and the size in bytes of this field
893 * is four times the value specified in bits 3..7. Hence the "& ~3".
895 add_cdb_offset
= srp_cmd
->add_cdb_len
& ~3;
896 if (((srp_cmd
->buf_fmt
& 0xf) == SRP_DATA_DESC_DIRECT
) ||
897 ((srp_cmd
->buf_fmt
>> 4) == SRP_DATA_DESC_DIRECT
)) {
899 ioctx
->rbufs
= &ioctx
->single_rbuf
;
901 db
= (struct srp_direct_buf
*)(srp_cmd
->add_data
903 memcpy(ioctx
->rbufs
, db
, sizeof *db
);
904 *data_len
= be32_to_cpu(db
->len
);
905 } else if (((srp_cmd
->buf_fmt
& 0xf) == SRP_DATA_DESC_INDIRECT
) ||
906 ((srp_cmd
->buf_fmt
>> 4) == SRP_DATA_DESC_INDIRECT
)) {
907 idb
= (struct srp_indirect_buf
*)(srp_cmd
->add_data
910 ioctx
->n_rbuf
= be32_to_cpu(idb
->table_desc
.len
) / sizeof *db
;
913 (srp_cmd
->data_out_desc_cnt
+ srp_cmd
->data_in_desc_cnt
)) {
914 printk(KERN_ERR
"received unsupported SRP_CMD request"
915 " type (%u out + %u in != %u / %zu)\n",
916 srp_cmd
->data_out_desc_cnt
,
917 srp_cmd
->data_in_desc_cnt
,
918 be32_to_cpu(idb
->table_desc
.len
),
925 if (ioctx
->n_rbuf
== 1)
926 ioctx
->rbufs
= &ioctx
->single_rbuf
;
929 kmalloc(ioctx
->n_rbuf
* sizeof *db
, GFP_ATOMIC
);
938 memcpy(ioctx
->rbufs
, db
, ioctx
->n_rbuf
* sizeof *db
);
939 *data_len
= be32_to_cpu(idb
->len
);
946 * srpt_init_ch_qp() - Initialize queue pair attributes.
948 * Initialized the attributes of queue pair 'qp' by allowing local write,
949 * remote read and remote write. Also transitions 'qp' to state IB_QPS_INIT.
951 static int srpt_init_ch_qp(struct srpt_rdma_ch
*ch
, struct ib_qp
*qp
)
953 struct ib_qp_attr
*attr
;
956 attr
= kzalloc(sizeof *attr
, GFP_KERNEL
);
960 attr
->qp_state
= IB_QPS_INIT
;
961 attr
->qp_access_flags
= IB_ACCESS_LOCAL_WRITE
| IB_ACCESS_REMOTE_READ
|
962 IB_ACCESS_REMOTE_WRITE
;
963 attr
->port_num
= ch
->sport
->port
;
964 attr
->pkey_index
= 0;
966 ret
= ib_modify_qp(qp
, attr
,
967 IB_QP_STATE
| IB_QP_ACCESS_FLAGS
| IB_QP_PORT
|
975 * srpt_ch_qp_rtr() - Change the state of a channel to 'ready to receive' (RTR).
976 * @ch: channel of the queue pair.
977 * @qp: queue pair to change the state of.
979 * Returns zero upon success and a negative value upon failure.
981 * Note: currently a struct ib_qp_attr takes 136 bytes on a 64-bit system.
982 * If this structure ever becomes larger, it might be necessary to allocate
983 * it dynamically instead of on the stack.
985 static int srpt_ch_qp_rtr(struct srpt_rdma_ch
*ch
, struct ib_qp
*qp
)
987 struct ib_qp_attr qp_attr
;
991 qp_attr
.qp_state
= IB_QPS_RTR
;
992 ret
= ib_cm_init_qp_attr(ch
->cm_id
, &qp_attr
, &attr_mask
);
996 qp_attr
.max_dest_rd_atomic
= 4;
998 ret
= ib_modify_qp(qp
, &qp_attr
, attr_mask
);
1005 * srpt_ch_qp_rts() - Change the state of a channel to 'ready to send' (RTS).
1006 * @ch: channel of the queue pair.
1007 * @qp: queue pair to change the state of.
1009 * Returns zero upon success and a negative value upon failure.
1011 * Note: currently a struct ib_qp_attr takes 136 bytes on a 64-bit system.
1012 * If this structure ever becomes larger, it might be necessary to allocate
1013 * it dynamically instead of on the stack.
1015 static int srpt_ch_qp_rts(struct srpt_rdma_ch
*ch
, struct ib_qp
*qp
)
1017 struct ib_qp_attr qp_attr
;
1021 qp_attr
.qp_state
= IB_QPS_RTS
;
1022 ret
= ib_cm_init_qp_attr(ch
->cm_id
, &qp_attr
, &attr_mask
);
1026 qp_attr
.max_rd_atomic
= 4;
1028 ret
= ib_modify_qp(qp
, &qp_attr
, attr_mask
);
1035 * srpt_ch_qp_err() - Set the channel queue pair state to 'error'.
1037 static int srpt_ch_qp_err(struct srpt_rdma_ch
*ch
)
1039 struct ib_qp_attr qp_attr
;
1041 qp_attr
.qp_state
= IB_QPS_ERR
;
1042 return ib_modify_qp(ch
->qp
, &qp_attr
, IB_QP_STATE
);
1046 * srpt_unmap_sg_to_ib_sge() - Unmap an IB SGE list.
1048 static void srpt_unmap_sg_to_ib_sge(struct srpt_rdma_ch
*ch
,
1049 struct srpt_send_ioctx
*ioctx
)
1051 struct scatterlist
*sg
;
1052 enum dma_data_direction dir
;
1056 BUG_ON(ioctx
->n_rdma
&& !ioctx
->rdma_ius
);
1058 while (ioctx
->n_rdma
)
1059 kfree(ioctx
->rdma_ius
[--ioctx
->n_rdma
].sge
);
1061 kfree(ioctx
->rdma_ius
);
1062 ioctx
->rdma_ius
= NULL
;
1064 if (ioctx
->mapped_sg_count
) {
1067 dir
= ioctx
->cmd
.data_direction
;
1068 BUG_ON(dir
== DMA_NONE
);
1069 ib_dma_unmap_sg(ch
->sport
->sdev
->device
, sg
, ioctx
->sg_cnt
,
1070 opposite_dma_dir(dir
));
1071 ioctx
->mapped_sg_count
= 0;
1076 * srpt_map_sg_to_ib_sge() - Map an SG list to an IB SGE list.
1078 static int srpt_map_sg_to_ib_sge(struct srpt_rdma_ch
*ch
,
1079 struct srpt_send_ioctx
*ioctx
)
1082 struct scatterlist
*sg
, *sg_orig
;
1084 enum dma_data_direction dir
;
1085 struct rdma_iu
*riu
;
1086 struct srp_direct_buf
*db
;
1087 dma_addr_t dma_addr
;
1099 dir
= cmd
->data_direction
;
1100 BUG_ON(dir
== DMA_NONE
);
1102 ioctx
->sg
= sg
= sg_orig
= cmd
->t_data_sg
;
1103 ioctx
->sg_cnt
= sg_cnt
= cmd
->t_data_nents
;
1105 count
= ib_dma_map_sg(ch
->sport
->sdev
->device
, sg
, sg_cnt
,
1106 opposite_dma_dir(dir
));
1107 if (unlikely(!count
))
1110 ioctx
->mapped_sg_count
= count
;
1112 if (ioctx
->rdma_ius
&& ioctx
->n_rdma_ius
)
1113 nrdma
= ioctx
->n_rdma_ius
;
1115 nrdma
= (count
+ SRPT_DEF_SG_PER_WQE
- 1) / SRPT_DEF_SG_PER_WQE
1118 ioctx
->rdma_ius
= kzalloc(nrdma
* sizeof *riu
, GFP_KERNEL
);
1119 if (!ioctx
->rdma_ius
)
1122 ioctx
->n_rdma_ius
= nrdma
;
1126 tsize
= cmd
->data_length
;
1127 dma_len
= sg_dma_len(&sg
[0]);
1128 riu
= ioctx
->rdma_ius
;
1131 * For each remote desc - calculate the #ib_sge.
1132 * If #ib_sge < SRPT_DEF_SG_PER_WQE per rdma operation then
1133 * each remote desc rdma_iu is required a rdma wr;
1135 * we need to allocate extra rdma_iu to carry extra #ib_sge in
1139 j
< count
&& i
< ioctx
->n_rbuf
&& tsize
> 0; ++i
, ++riu
, ++db
) {
1140 rsize
= be32_to_cpu(db
->len
);
1141 raddr
= be64_to_cpu(db
->va
);
1143 riu
->rkey
= be32_to_cpu(db
->key
);
1146 /* calculate how many sge required for this remote_buf */
1147 while (rsize
> 0 && tsize
> 0) {
1149 if (rsize
>= dma_len
) {
1158 dma_len
= sg_dma_len(sg
);
1169 if (rsize
> 0 && riu
->sge_cnt
== SRPT_DEF_SG_PER_WQE
) {
1172 kmalloc(riu
->sge_cnt
* sizeof *riu
->sge
,
1180 riu
->rkey
= be32_to_cpu(db
->key
);
1185 riu
->sge
= kmalloc(riu
->sge_cnt
* sizeof *riu
->sge
,
1192 tsize
= cmd
->data_length
;
1193 riu
= ioctx
->rdma_ius
;
1195 dma_len
= sg_dma_len(&sg
[0]);
1196 dma_addr
= sg_dma_address(&sg
[0]);
1198 /* this second loop is really mapped sg_addres to rdma_iu->ib_sge */
1200 j
< count
&& i
< ioctx
->n_rbuf
&& tsize
> 0; ++i
, ++riu
, ++db
) {
1201 rsize
= be32_to_cpu(db
->len
);
1205 while (rsize
> 0 && tsize
> 0) {
1206 sge
->addr
= dma_addr
;
1207 sge
->lkey
= ch
->sport
->sdev
->mr
->lkey
;
1209 if (rsize
>= dma_len
) {
1211 (tsize
< dma_len
) ? tsize
: dma_len
;
1219 dma_len
= sg_dma_len(sg
);
1220 dma_addr
= sg_dma_address(sg
);
1224 sge
->length
= (tsize
< rsize
) ? tsize
: rsize
;
1232 if (k
== riu
->sge_cnt
&& rsize
> 0 && tsize
> 0) {
1236 } else if (rsize
> 0 && tsize
> 0)
1244 srpt_unmap_sg_to_ib_sge(ch
, ioctx
);
1250 * srpt_get_send_ioctx() - Obtain an I/O context for sending to the initiator.
1252 static struct srpt_send_ioctx
*srpt_get_send_ioctx(struct srpt_rdma_ch
*ch
)
1254 struct srpt_send_ioctx
*ioctx
;
1255 unsigned long flags
;
1260 spin_lock_irqsave(&ch
->spinlock
, flags
);
1261 if (!list_empty(&ch
->free_list
)) {
1262 ioctx
= list_first_entry(&ch
->free_list
,
1263 struct srpt_send_ioctx
, free_list
);
1264 list_del(&ioctx
->free_list
);
1266 spin_unlock_irqrestore(&ch
->spinlock
, flags
);
1271 BUG_ON(ioctx
->ch
!= ch
);
1272 kref_init(&ioctx
->kref
);
1273 spin_lock_init(&ioctx
->spinlock
);
1274 ioctx
->state
= SRPT_STATE_NEW
;
1276 ioctx
->rbufs
= NULL
;
1278 ioctx
->n_rdma_ius
= 0;
1279 ioctx
->rdma_ius
= NULL
;
1280 ioctx
->mapped_sg_count
= 0;
1281 init_completion(&ioctx
->tx_done
);
1282 ioctx
->queue_status_only
= false;
1284 * transport_init_se_cmd() does not initialize all fields, so do it
1287 memset(&ioctx
->cmd
, 0, sizeof(ioctx
->cmd
));
1288 memset(&ioctx
->sense_data
, 0, sizeof(ioctx
->sense_data
));
1294 * srpt_put_send_ioctx() - Free up resources.
1296 static void srpt_put_send_ioctx(struct srpt_send_ioctx
*ioctx
)
1298 struct srpt_rdma_ch
*ch
;
1299 unsigned long flags
;
1305 WARN_ON(srpt_get_cmd_state(ioctx
) != SRPT_STATE_DONE
);
1307 srpt_unmap_sg_to_ib_sge(ioctx
->ch
, ioctx
);
1308 transport_generic_free_cmd(&ioctx
->cmd
, 0);
1310 if (ioctx
->n_rbuf
> 1) {
1311 kfree(ioctx
->rbufs
);
1312 ioctx
->rbufs
= NULL
;
1316 spin_lock_irqsave(&ch
->spinlock
, flags
);
1317 list_add(&ioctx
->free_list
, &ch
->free_list
);
1318 spin_unlock_irqrestore(&ch
->spinlock
, flags
);
1321 static void srpt_put_send_ioctx_kref(struct kref
*kref
)
1323 srpt_put_send_ioctx(container_of(kref
, struct srpt_send_ioctx
, kref
));
1327 * srpt_abort_cmd() - Abort a SCSI command.
1328 * @ioctx: I/O context associated with the SCSI command.
1329 * @context: Preferred execution context.
1331 static int srpt_abort_cmd(struct srpt_send_ioctx
*ioctx
)
1333 enum srpt_command_state state
;
1334 unsigned long flags
;
1339 * If the command is in a state where the target core is waiting for
1340 * the ib_srpt driver, change the state to the next state. Changing
1341 * the state of the command from SRPT_STATE_NEED_DATA to
1342 * SRPT_STATE_DATA_IN ensures that srpt_xmit_response() will call this
1343 * function a second time.
1346 spin_lock_irqsave(&ioctx
->spinlock
, flags
);
1347 state
= ioctx
->state
;
1349 case SRPT_STATE_NEED_DATA
:
1350 ioctx
->state
= SRPT_STATE_DATA_IN
;
1352 case SRPT_STATE_DATA_IN
:
1353 case SRPT_STATE_CMD_RSP_SENT
:
1354 case SRPT_STATE_MGMT_RSP_SENT
:
1355 ioctx
->state
= SRPT_STATE_DONE
;
1360 spin_unlock_irqrestore(&ioctx
->spinlock
, flags
);
1362 if (state
== SRPT_STATE_DONE
)
1365 pr_debug("Aborting cmd with state %d and tag %lld\n", state
,
1369 case SRPT_STATE_NEW
:
1370 case SRPT_STATE_DATA_IN
:
1371 case SRPT_STATE_MGMT
:
1373 * Do nothing - defer abort processing until
1374 * srpt_queue_response() is invoked.
1376 WARN_ON(!transport_check_aborted_status(&ioctx
->cmd
, false));
1378 case SRPT_STATE_NEED_DATA
:
1379 /* DMA_TO_DEVICE (write) - RDMA read error. */
1380 spin_lock_irqsave(&ioctx
->cmd
.t_state_lock
, flags
);
1381 ioctx
->cmd
.transport_state
|= CMD_T_LUN_STOP
;
1382 spin_unlock_irqrestore(&ioctx
->cmd
.t_state_lock
, flags
);
1383 transport_generic_handle_data(&ioctx
->cmd
);
1385 case SRPT_STATE_CMD_RSP_SENT
:
1387 * SRP_RSP sending failed or the SRP_RSP send completion has
1388 * not been received in time.
1390 srpt_unmap_sg_to_ib_sge(ioctx
->ch
, ioctx
);
1391 spin_lock_irqsave(&ioctx
->cmd
.t_state_lock
, flags
);
1392 ioctx
->cmd
.transport_state
|= CMD_T_LUN_STOP
;
1393 spin_unlock_irqrestore(&ioctx
->cmd
.t_state_lock
, flags
);
1394 kref_put(&ioctx
->kref
, srpt_put_send_ioctx_kref
);
1396 case SRPT_STATE_MGMT_RSP_SENT
:
1397 srpt_set_cmd_state(ioctx
, SRPT_STATE_DONE
);
1398 kref_put(&ioctx
->kref
, srpt_put_send_ioctx_kref
);
1401 WARN_ON("ERROR: unexpected command state");
1410 * srpt_handle_send_err_comp() - Process an IB_WC_SEND error completion.
1412 static void srpt_handle_send_err_comp(struct srpt_rdma_ch
*ch
, u64 wr_id
)
1414 struct srpt_send_ioctx
*ioctx
;
1415 enum srpt_command_state state
;
1419 atomic_inc(&ch
->sq_wr_avail
);
1421 index
= idx_from_wr_id(wr_id
);
1422 ioctx
= ch
->ioctx_ring
[index
];
1423 state
= srpt_get_cmd_state(ioctx
);
1426 WARN_ON(state
!= SRPT_STATE_CMD_RSP_SENT
1427 && state
!= SRPT_STATE_MGMT_RSP_SENT
1428 && state
!= SRPT_STATE_NEED_DATA
1429 && state
!= SRPT_STATE_DONE
);
1431 /* If SRP_RSP sending failed, undo the ch->req_lim change. */
1432 if (state
== SRPT_STATE_CMD_RSP_SENT
1433 || state
== SRPT_STATE_MGMT_RSP_SENT
)
1434 atomic_dec(&ch
->req_lim
);
1436 srpt_abort_cmd(ioctx
);
1440 * srpt_handle_send_comp() - Process an IB send completion notification.
1442 static void srpt_handle_send_comp(struct srpt_rdma_ch
*ch
,
1443 struct srpt_send_ioctx
*ioctx
)
1445 enum srpt_command_state state
;
1447 atomic_inc(&ch
->sq_wr_avail
);
1449 state
= srpt_set_cmd_state(ioctx
, SRPT_STATE_DONE
);
1451 if (WARN_ON(state
!= SRPT_STATE_CMD_RSP_SENT
1452 && state
!= SRPT_STATE_MGMT_RSP_SENT
1453 && state
!= SRPT_STATE_DONE
))
1454 pr_debug("state = %d\n", state
);
1456 if (state
!= SRPT_STATE_DONE
)
1457 kref_put(&ioctx
->kref
, srpt_put_send_ioctx_kref
);
1459 printk(KERN_ERR
"IB completion has been received too late for"
1460 " wr_id = %u.\n", ioctx
->ioctx
.index
);
1464 * srpt_handle_rdma_comp() - Process an IB RDMA completion notification.
1466 * Note: transport_generic_handle_data() is asynchronous so unmapping the
1467 * data that has been transferred via IB RDMA must be postponed until the
1468 * check_stop_free() callback.
1470 static void srpt_handle_rdma_comp(struct srpt_rdma_ch
*ch
,
1471 struct srpt_send_ioctx
*ioctx
,
1472 enum srpt_opcode opcode
)
1474 WARN_ON(ioctx
->n_rdma
<= 0);
1475 atomic_add(ioctx
->n_rdma
, &ch
->sq_wr_avail
);
1477 if (opcode
== SRPT_RDMA_READ_LAST
) {
1478 if (srpt_test_and_set_cmd_state(ioctx
, SRPT_STATE_NEED_DATA
,
1479 SRPT_STATE_DATA_IN
))
1480 transport_generic_handle_data(&ioctx
->cmd
);
1482 printk(KERN_ERR
"%s[%d]: wrong state = %d\n", __func__
,
1483 __LINE__
, srpt_get_cmd_state(ioctx
));
1484 } else if (opcode
== SRPT_RDMA_ABORT
) {
1485 ioctx
->rdma_aborted
= true;
1487 WARN(true, "unexpected opcode %d\n", opcode
);
1492 * srpt_handle_rdma_err_comp() - Process an IB RDMA error completion.
1494 static void srpt_handle_rdma_err_comp(struct srpt_rdma_ch
*ch
,
1495 struct srpt_send_ioctx
*ioctx
,
1496 enum srpt_opcode opcode
)
1499 enum srpt_command_state state
;
1500 unsigned long flags
;
1503 state
= srpt_get_cmd_state(ioctx
);
1505 case SRPT_RDMA_READ_LAST
:
1506 if (ioctx
->n_rdma
<= 0) {
1507 printk(KERN_ERR
"Received invalid RDMA read"
1508 " error completion with idx %d\n",
1509 ioctx
->ioctx
.index
);
1512 atomic_add(ioctx
->n_rdma
, &ch
->sq_wr_avail
);
1513 if (state
== SRPT_STATE_NEED_DATA
)
1514 srpt_abort_cmd(ioctx
);
1516 printk(KERN_ERR
"%s[%d]: wrong state = %d\n",
1517 __func__
, __LINE__
, state
);
1519 case SRPT_RDMA_WRITE_LAST
:
1520 spin_lock_irqsave(&ioctx
->cmd
.t_state_lock
, flags
);
1521 ioctx
->cmd
.transport_state
|= CMD_T_LUN_STOP
;
1522 spin_unlock_irqrestore(&ioctx
->cmd
.t_state_lock
, flags
);
1525 printk(KERN_ERR
"%s[%d]: opcode = %u\n", __func__
,
1532 * srpt_build_cmd_rsp() - Build an SRP_RSP response.
1533 * @ch: RDMA channel through which the request has been received.
1534 * @ioctx: I/O context associated with the SRP_CMD request. The response will
1535 * be built in the buffer ioctx->buf points at and hence this function will
1536 * overwrite the request data.
1537 * @tag: tag of the request for which this response is being generated.
1538 * @status: value for the STATUS field of the SRP_RSP information unit.
1540 * Returns the size in bytes of the SRP_RSP response.
1542 * An SRP_RSP response contains a SCSI status or service response. See also
1543 * section 6.9 in the SRP r16a document for the format of an SRP_RSP
1544 * response. See also SPC-2 for more information about sense data.
1546 static int srpt_build_cmd_rsp(struct srpt_rdma_ch
*ch
,
1547 struct srpt_send_ioctx
*ioctx
, u64 tag
,
1550 struct srp_rsp
*srp_rsp
;
1551 const u8
*sense_data
;
1552 int sense_data_len
, max_sense_len
;
1555 * The lowest bit of all SAM-3 status codes is zero (see also
1556 * paragraph 5.3 in SAM-3).
1558 WARN_ON(status
& 1);
1560 srp_rsp
= ioctx
->ioctx
.buf
;
1563 sense_data
= ioctx
->sense_data
;
1564 sense_data_len
= ioctx
->cmd
.scsi_sense_length
;
1565 WARN_ON(sense_data_len
> sizeof(ioctx
->sense_data
));
1567 memset(srp_rsp
, 0, sizeof *srp_rsp
);
1568 srp_rsp
->opcode
= SRP_RSP
;
1569 srp_rsp
->req_lim_delta
=
1570 __constant_cpu_to_be32(1 + atomic_xchg(&ch
->req_lim_delta
, 0));
1572 srp_rsp
->status
= status
;
1574 if (sense_data_len
) {
1575 BUILD_BUG_ON(MIN_MAX_RSP_SIZE
<= sizeof(*srp_rsp
));
1576 max_sense_len
= ch
->max_ti_iu_len
- sizeof(*srp_rsp
);
1577 if (sense_data_len
> max_sense_len
) {
1578 printk(KERN_WARNING
"truncated sense data from %d to %d"
1579 " bytes\n", sense_data_len
, max_sense_len
);
1580 sense_data_len
= max_sense_len
;
1583 srp_rsp
->flags
|= SRP_RSP_FLAG_SNSVALID
;
1584 srp_rsp
->sense_data_len
= cpu_to_be32(sense_data_len
);
1585 memcpy(srp_rsp
+ 1, sense_data
, sense_data_len
);
1588 return sizeof(*srp_rsp
) + sense_data_len
;
1592 * srpt_build_tskmgmt_rsp() - Build a task management response.
1593 * @ch: RDMA channel through which the request has been received.
1594 * @ioctx: I/O context in which the SRP_RSP response will be built.
1595 * @rsp_code: RSP_CODE that will be stored in the response.
1596 * @tag: Tag of the request for which this response is being generated.
1598 * Returns the size in bytes of the SRP_RSP response.
1600 * An SRP_RSP response contains a SCSI status or service response. See also
1601 * section 6.9 in the SRP r16a document for the format of an SRP_RSP
1604 static int srpt_build_tskmgmt_rsp(struct srpt_rdma_ch
*ch
,
1605 struct srpt_send_ioctx
*ioctx
,
1606 u8 rsp_code
, u64 tag
)
1608 struct srp_rsp
*srp_rsp
;
1612 resp_data_len
= (rsp_code
== SRP_TSK_MGMT_SUCCESS
) ? 0 : 4;
1613 resp_len
= sizeof(*srp_rsp
) + resp_data_len
;
1615 srp_rsp
= ioctx
->ioctx
.buf
;
1617 memset(srp_rsp
, 0, sizeof *srp_rsp
);
1619 srp_rsp
->opcode
= SRP_RSP
;
1620 srp_rsp
->req_lim_delta
= __constant_cpu_to_be32(1
1621 + atomic_xchg(&ch
->req_lim_delta
, 0));
1624 if (rsp_code
!= SRP_TSK_MGMT_SUCCESS
) {
1625 srp_rsp
->flags
|= SRP_RSP_FLAG_RSPVALID
;
1626 srp_rsp
->resp_data_len
= cpu_to_be32(resp_data_len
);
1627 srp_rsp
->data
[3] = rsp_code
;
1633 #define NO_SUCH_LUN ((uint64_t)-1LL)
1636 * SCSI LUN addressing method. See also SAM-2 and the section about
1639 enum scsi_lun_addr_method
{
1640 SCSI_LUN_ADDR_METHOD_PERIPHERAL
= 0,
1641 SCSI_LUN_ADDR_METHOD_FLAT
= 1,
1642 SCSI_LUN_ADDR_METHOD_LUN
= 2,
1643 SCSI_LUN_ADDR_METHOD_EXTENDED_LUN
= 3,
1647 * srpt_unpack_lun() - Convert from network LUN to linear LUN.
1649 * Convert an 2-byte, 4-byte, 6-byte or 8-byte LUN structure in network byte
1650 * order (big endian) to a linear LUN. Supports three LUN addressing methods:
1651 * peripheral, flat and logical unit. See also SAM-2, section 4.9.4 (page 40).
1653 static uint64_t srpt_unpack_lun(const uint8_t *lun
, int len
)
1655 uint64_t res
= NO_SUCH_LUN
;
1656 int addressing_method
;
1658 if (unlikely(len
< 2)) {
1659 printk(KERN_ERR
"Illegal LUN length %d, expected 2 bytes or "
1666 if ((*((__be64
*)lun
) &
1667 __constant_cpu_to_be64(0x0000FFFFFFFFFFFFLL
)) != 0)
1671 if (*((__be16
*)&lun
[2]) != 0)
1675 if (*((__be32
*)&lun
[2]) != 0)
1684 addressing_method
= (*lun
) >> 6; /* highest two bits of byte 0 */
1685 switch (addressing_method
) {
1686 case SCSI_LUN_ADDR_METHOD_PERIPHERAL
:
1687 case SCSI_LUN_ADDR_METHOD_FLAT
:
1688 case SCSI_LUN_ADDR_METHOD_LUN
:
1689 res
= *(lun
+ 1) | (((*lun
) & 0x3f) << 8);
1692 case SCSI_LUN_ADDR_METHOD_EXTENDED_LUN
:
1694 printk(KERN_ERR
"Unimplemented LUN addressing method %u",
1703 printk(KERN_ERR
"Support for multi-level LUNs has not yet been"
1708 static int srpt_check_stop_free(struct se_cmd
*cmd
)
1710 struct srpt_send_ioctx
*ioctx
;
1712 ioctx
= container_of(cmd
, struct srpt_send_ioctx
, cmd
);
1713 return kref_put(&ioctx
->kref
, srpt_put_send_ioctx_kref
);
1717 * srpt_handle_cmd() - Process SRP_CMD.
1719 static int srpt_handle_cmd(struct srpt_rdma_ch
*ch
,
1720 struct srpt_recv_ioctx
*recv_ioctx
,
1721 struct srpt_send_ioctx
*send_ioctx
)
1724 struct srp_cmd
*srp_cmd
;
1725 uint64_t unpacked_lun
;
1727 enum dma_data_direction dir
;
1730 BUG_ON(!send_ioctx
);
1732 srp_cmd
= recv_ioctx
->ioctx
.buf
;
1733 kref_get(&send_ioctx
->kref
);
1734 cmd
= &send_ioctx
->cmd
;
1735 send_ioctx
->tag
= srp_cmd
->tag
;
1737 switch (srp_cmd
->task_attr
) {
1738 case SRP_CMD_SIMPLE_Q
:
1739 cmd
->sam_task_attr
= MSG_SIMPLE_TAG
;
1741 case SRP_CMD_ORDERED_Q
:
1743 cmd
->sam_task_attr
= MSG_ORDERED_TAG
;
1745 case SRP_CMD_HEAD_OF_Q
:
1746 cmd
->sam_task_attr
= MSG_HEAD_TAG
;
1749 cmd
->sam_task_attr
= MSG_ACA_TAG
;
1753 ret
= srpt_get_desc_tbl(send_ioctx
, srp_cmd
, &dir
, &data_len
);
1755 printk(KERN_ERR
"0x%llx: parsing SRP descriptor table failed.\n",
1757 cmd
->se_cmd_flags
|= SCF_SCSI_CDB_EXCEPTION
;
1758 cmd
->scsi_sense_reason
= TCM_INVALID_CDB_FIELD
;
1759 kref_put(&send_ioctx
->kref
, srpt_put_send_ioctx_kref
);
1763 cmd
->data_length
= data_len
;
1764 cmd
->data_direction
= dir
;
1765 unpacked_lun
= srpt_unpack_lun((uint8_t *)&srp_cmd
->lun
,
1766 sizeof(srp_cmd
->lun
));
1767 if (transport_lookup_cmd_lun(cmd
, unpacked_lun
) < 0) {
1768 kref_put(&send_ioctx
->kref
, srpt_put_send_ioctx_kref
);
1771 ret
= target_setup_cmd_from_cdb(cmd
, srp_cmd
->cdb
);
1773 kref_put(&send_ioctx
->kref
, srpt_put_send_ioctx_kref
);
1774 if (cmd
->se_cmd_flags
& SCF_SCSI_RESERVATION_CONFLICT
) {
1775 srpt_queue_status(cmd
);
1781 transport_handle_cdb_direct(cmd
);
1785 transport_send_check_condition_and_sense(cmd
, cmd
->scsi_sense_reason
,
1791 * srpt_rx_mgmt_fn_tag() - Process a task management function by tag.
1792 * @ch: RDMA channel of the task management request.
1793 * @fn: Task management function to perform.
1794 * @req_tag: Tag of the SRP task management request.
1795 * @mgmt_ioctx: I/O context of the task management request.
1797 * Returns zero if the target core will process the task management
1798 * request asynchronously.
1800 * Note: It is assumed that the initiator serializes tag-based task management
1803 static int srpt_rx_mgmt_fn_tag(struct srpt_send_ioctx
*ioctx
, u64 tag
)
1805 struct srpt_device
*sdev
;
1806 struct srpt_rdma_ch
*ch
;
1807 struct srpt_send_ioctx
*target
;
1814 sdev
= ch
->sport
->sdev
;
1816 spin_lock_irq(&sdev
->spinlock
);
1817 for (i
= 0; i
< ch
->rq_size
; ++i
) {
1818 target
= ch
->ioctx_ring
[i
];
1819 if (target
->cmd
.se_lun
== ioctx
->cmd
.se_lun
&&
1820 target
->tag
== tag
&&
1821 srpt_get_cmd_state(target
) != SRPT_STATE_DONE
) {
1823 /* now let the target core abort &target->cmd; */
1827 spin_unlock_irq(&sdev
->spinlock
);
1831 static int srp_tmr_to_tcm(int fn
)
1834 case SRP_TSK_ABORT_TASK
:
1835 return TMR_ABORT_TASK
;
1836 case SRP_TSK_ABORT_TASK_SET
:
1837 return TMR_ABORT_TASK_SET
;
1838 case SRP_TSK_CLEAR_TASK_SET
:
1839 return TMR_CLEAR_TASK_SET
;
1840 case SRP_TSK_LUN_RESET
:
1841 return TMR_LUN_RESET
;
1842 case SRP_TSK_CLEAR_ACA
:
1843 return TMR_CLEAR_ACA
;
1850 * srpt_handle_tsk_mgmt() - Process an SRP_TSK_MGMT information unit.
1852 * Returns 0 if and only if the request will be processed by the target core.
1854 * For more information about SRP_TSK_MGMT information units, see also section
1855 * 6.7 in the SRP r16a document.
1857 static void srpt_handle_tsk_mgmt(struct srpt_rdma_ch
*ch
,
1858 struct srpt_recv_ioctx
*recv_ioctx
,
1859 struct srpt_send_ioctx
*send_ioctx
)
1861 struct srp_tsk_mgmt
*srp_tsk
;
1863 uint64_t unpacked_lun
;
1867 BUG_ON(!send_ioctx
);
1869 srp_tsk
= recv_ioctx
->ioctx
.buf
;
1870 cmd
= &send_ioctx
->cmd
;
1872 pr_debug("recv tsk_mgmt fn %d for task_tag %lld and cmd tag %lld"
1873 " cm_id %p sess %p\n", srp_tsk
->tsk_mgmt_func
,
1874 srp_tsk
->task_tag
, srp_tsk
->tag
, ch
->cm_id
, ch
->sess
);
1876 srpt_set_cmd_state(send_ioctx
, SRPT_STATE_MGMT
);
1877 send_ioctx
->tag
= srp_tsk
->tag
;
1878 tcm_tmr
= srp_tmr_to_tcm(srp_tsk
->tsk_mgmt_func
);
1880 send_ioctx
->cmd
.se_cmd_flags
|= SCF_SCSI_CDB_EXCEPTION
;
1881 send_ioctx
->cmd
.se_tmr_req
->response
=
1882 TMR_TASK_MGMT_FUNCTION_NOT_SUPPORTED
;
1885 res
= core_tmr_alloc_req(cmd
, NULL
, tcm_tmr
, GFP_KERNEL
);
1887 send_ioctx
->cmd
.se_cmd_flags
|= SCF_SCSI_CDB_EXCEPTION
;
1888 send_ioctx
->cmd
.se_tmr_req
->response
= TMR_FUNCTION_REJECTED
;
1892 unpacked_lun
= srpt_unpack_lun((uint8_t *)&srp_tsk
->lun
,
1893 sizeof(srp_tsk
->lun
));
1894 res
= transport_lookup_tmr_lun(&send_ioctx
->cmd
, unpacked_lun
);
1896 pr_debug("rejecting TMR for LUN %lld\n", unpacked_lun
);
1897 send_ioctx
->cmd
.se_cmd_flags
|= SCF_SCSI_CDB_EXCEPTION
;
1898 send_ioctx
->cmd
.se_tmr_req
->response
= TMR_LUN_DOES_NOT_EXIST
;
1902 if (srp_tsk
->tsk_mgmt_func
== SRP_TSK_ABORT_TASK
)
1903 srpt_rx_mgmt_fn_tag(send_ioctx
, srp_tsk
->task_tag
);
1906 kref_get(&send_ioctx
->kref
);
1907 if (!(send_ioctx
->cmd
.se_cmd_flags
& SCF_SCSI_CDB_EXCEPTION
))
1908 transport_generic_handle_tmr(&send_ioctx
->cmd
);
1910 transport_send_check_condition_and_sense(cmd
,
1911 cmd
->scsi_sense_reason
, 0);
1916 * srpt_handle_new_iu() - Process a newly received information unit.
1917 * @ch: RDMA channel through which the information unit has been received.
1918 * @ioctx: SRPT I/O context associated with the information unit.
1920 static void srpt_handle_new_iu(struct srpt_rdma_ch
*ch
,
1921 struct srpt_recv_ioctx
*recv_ioctx
,
1922 struct srpt_send_ioctx
*send_ioctx
)
1924 struct srp_cmd
*srp_cmd
;
1925 enum rdma_ch_state ch_state
;
1928 BUG_ON(!recv_ioctx
);
1930 ib_dma_sync_single_for_cpu(ch
->sport
->sdev
->device
,
1931 recv_ioctx
->ioctx
.dma
, srp_max_req_size
,
1934 ch_state
= srpt_get_ch_state(ch
);
1935 if (unlikely(ch_state
== CH_CONNECTING
)) {
1936 list_add_tail(&recv_ioctx
->wait_list
, &ch
->cmd_wait_list
);
1940 if (unlikely(ch_state
!= CH_LIVE
))
1943 srp_cmd
= recv_ioctx
->ioctx
.buf
;
1944 if (srp_cmd
->opcode
== SRP_CMD
|| srp_cmd
->opcode
== SRP_TSK_MGMT
) {
1946 send_ioctx
= srpt_get_send_ioctx(ch
);
1947 if (unlikely(!send_ioctx
)) {
1948 list_add_tail(&recv_ioctx
->wait_list
,
1949 &ch
->cmd_wait_list
);
1954 transport_init_se_cmd(&send_ioctx
->cmd
, &srpt_target
->tf_ops
, ch
->sess
,
1955 0, DMA_NONE
, MSG_SIMPLE_TAG
,
1956 send_ioctx
->sense_data
);
1958 switch (srp_cmd
->opcode
) {
1960 srpt_handle_cmd(ch
, recv_ioctx
, send_ioctx
);
1963 srpt_handle_tsk_mgmt(ch
, recv_ioctx
, send_ioctx
);
1966 printk(KERN_ERR
"Not yet implemented: SRP_I_LOGOUT\n");
1969 pr_debug("received SRP_CRED_RSP\n");
1972 pr_debug("received SRP_AER_RSP\n");
1975 printk(KERN_ERR
"Received SRP_RSP\n");
1978 printk(KERN_ERR
"received IU with unknown opcode 0x%x\n",
1983 srpt_post_recv(ch
->sport
->sdev
, recv_ioctx
);
1988 static void srpt_process_rcv_completion(struct ib_cq
*cq
,
1989 struct srpt_rdma_ch
*ch
,
1992 struct srpt_device
*sdev
= ch
->sport
->sdev
;
1993 struct srpt_recv_ioctx
*ioctx
;
1996 index
= idx_from_wr_id(wc
->wr_id
);
1997 if (wc
->status
== IB_WC_SUCCESS
) {
2000 req_lim
= atomic_dec_return(&ch
->req_lim
);
2001 if (unlikely(req_lim
< 0))
2002 printk(KERN_ERR
"req_lim = %d < 0\n", req_lim
);
2003 ioctx
= sdev
->ioctx_ring
[index
];
2004 srpt_handle_new_iu(ch
, ioctx
, NULL
);
2006 printk(KERN_INFO
"receiving failed for idx %u with status %d\n",
2012 * srpt_process_send_completion() - Process an IB send completion.
2014 * Note: Although this has not yet been observed during tests, at least in
2015 * theory it is possible that the srpt_get_send_ioctx() call invoked by
2016 * srpt_handle_new_iu() fails. This is possible because the req_lim_delta
2017 * value in each response is set to one, and it is possible that this response
2018 * makes the initiator send a new request before the send completion for that
2019 * response has been processed. This could e.g. happen if the call to
2020 * srpt_put_send_iotcx() is delayed because of a higher priority interrupt or
2021 * if IB retransmission causes generation of the send completion to be
2022 * delayed. Incoming information units for which srpt_get_send_ioctx() fails
2023 * are queued on cmd_wait_list. The code below processes these delayed
2024 * requests one at a time.
2026 static void srpt_process_send_completion(struct ib_cq
*cq
,
2027 struct srpt_rdma_ch
*ch
,
2030 struct srpt_send_ioctx
*send_ioctx
;
2032 enum srpt_opcode opcode
;
2034 index
= idx_from_wr_id(wc
->wr_id
);
2035 opcode
= opcode_from_wr_id(wc
->wr_id
);
2036 send_ioctx
= ch
->ioctx_ring
[index
];
2037 if (wc
->status
== IB_WC_SUCCESS
) {
2038 if (opcode
== SRPT_SEND
)
2039 srpt_handle_send_comp(ch
, send_ioctx
);
2041 WARN_ON(opcode
!= SRPT_RDMA_ABORT
&&
2042 wc
->opcode
!= IB_WC_RDMA_READ
);
2043 srpt_handle_rdma_comp(ch
, send_ioctx
, opcode
);
2046 if (opcode
== SRPT_SEND
) {
2047 printk(KERN_INFO
"sending response for idx %u failed"
2048 " with status %d\n", index
, wc
->status
);
2049 srpt_handle_send_err_comp(ch
, wc
->wr_id
);
2050 } else if (opcode
!= SRPT_RDMA_MID
) {
2051 printk(KERN_INFO
"RDMA t %d for idx %u failed with"
2052 " status %d", opcode
, index
, wc
->status
);
2053 srpt_handle_rdma_err_comp(ch
, send_ioctx
, opcode
);
2057 while (unlikely(opcode
== SRPT_SEND
2058 && !list_empty(&ch
->cmd_wait_list
)
2059 && srpt_get_ch_state(ch
) == CH_LIVE
2060 && (send_ioctx
= srpt_get_send_ioctx(ch
)) != NULL
)) {
2061 struct srpt_recv_ioctx
*recv_ioctx
;
2063 recv_ioctx
= list_first_entry(&ch
->cmd_wait_list
,
2064 struct srpt_recv_ioctx
,
2066 list_del(&recv_ioctx
->wait_list
);
2067 srpt_handle_new_iu(ch
, recv_ioctx
, send_ioctx
);
2071 static void srpt_process_completion(struct ib_cq
*cq
, struct srpt_rdma_ch
*ch
)
2073 struct ib_wc
*const wc
= ch
->wc
;
2076 WARN_ON(cq
!= ch
->cq
);
2078 ib_req_notify_cq(cq
, IB_CQ_NEXT_COMP
);
2079 while ((n
= ib_poll_cq(cq
, ARRAY_SIZE(ch
->wc
), wc
)) > 0) {
2080 for (i
= 0; i
< n
; i
++) {
2081 if (opcode_from_wr_id(wc
[i
].wr_id
) == SRPT_RECV
)
2082 srpt_process_rcv_completion(cq
, ch
, &wc
[i
]);
2084 srpt_process_send_completion(cq
, ch
, &wc
[i
]);
2090 * srpt_completion() - IB completion queue callback function.
2093 * - It is guaranteed that a completion handler will never be invoked
2094 * concurrently on two different CPUs for the same completion queue. See also
2095 * Documentation/infiniband/core_locking.txt and the implementation of
2096 * handle_edge_irq() in kernel/irq/chip.c.
2097 * - When threaded IRQs are enabled, completion handlers are invoked in thread
2098 * context instead of interrupt context.
2100 static void srpt_completion(struct ib_cq
*cq
, void *ctx
)
2102 struct srpt_rdma_ch
*ch
= ctx
;
2104 wake_up_interruptible(&ch
->wait_queue
);
2107 static int srpt_compl_thread(void *arg
)
2109 struct srpt_rdma_ch
*ch
;
2111 /* Hibernation / freezing of the SRPT kernel thread is not supported. */
2112 current
->flags
|= PF_NOFREEZE
;
2116 printk(KERN_INFO
"Session %s: kernel thread %s (PID %d) started\n",
2117 ch
->sess_name
, ch
->thread
->comm
, current
->pid
);
2118 while (!kthread_should_stop()) {
2119 wait_event_interruptible(ch
->wait_queue
,
2120 (srpt_process_completion(ch
->cq
, ch
),
2121 kthread_should_stop()));
2123 printk(KERN_INFO
"Session %s: kernel thread %s (PID %d) stopped\n",
2124 ch
->sess_name
, ch
->thread
->comm
, current
->pid
);
2129 * srpt_create_ch_ib() - Create receive and send completion queues.
2131 static int srpt_create_ch_ib(struct srpt_rdma_ch
*ch
)
2133 struct ib_qp_init_attr
*qp_init
;
2134 struct srpt_port
*sport
= ch
->sport
;
2135 struct srpt_device
*sdev
= sport
->sdev
;
2136 u32 srp_sq_size
= sport
->port_attrib
.srp_sq_size
;
2139 WARN_ON(ch
->rq_size
< 1);
2142 qp_init
= kzalloc(sizeof *qp_init
, GFP_KERNEL
);
2146 ch
->cq
= ib_create_cq(sdev
->device
, srpt_completion
, NULL
, ch
,
2147 ch
->rq_size
+ srp_sq_size
, 0);
2148 if (IS_ERR(ch
->cq
)) {
2149 ret
= PTR_ERR(ch
->cq
);
2150 printk(KERN_ERR
"failed to create CQ cqe= %d ret= %d\n",
2151 ch
->rq_size
+ srp_sq_size
, ret
);
2155 qp_init
->qp_context
= (void *)ch
;
2156 qp_init
->event_handler
2157 = (void(*)(struct ib_event
*, void*))srpt_qp_event
;
2158 qp_init
->send_cq
= ch
->cq
;
2159 qp_init
->recv_cq
= ch
->cq
;
2160 qp_init
->srq
= sdev
->srq
;
2161 qp_init
->sq_sig_type
= IB_SIGNAL_REQ_WR
;
2162 qp_init
->qp_type
= IB_QPT_RC
;
2163 qp_init
->cap
.max_send_wr
= srp_sq_size
;
2164 qp_init
->cap
.max_send_sge
= SRPT_DEF_SG_PER_WQE
;
2166 ch
->qp
= ib_create_qp(sdev
->pd
, qp_init
);
2167 if (IS_ERR(ch
->qp
)) {
2168 ret
= PTR_ERR(ch
->qp
);
2169 printk(KERN_ERR
"failed to create_qp ret= %d\n", ret
);
2170 goto err_destroy_cq
;
2173 atomic_set(&ch
->sq_wr_avail
, qp_init
->cap
.max_send_wr
);
2175 pr_debug("%s: max_cqe= %d max_sge= %d sq_size = %d cm_id= %p\n",
2176 __func__
, ch
->cq
->cqe
, qp_init
->cap
.max_send_sge
,
2177 qp_init
->cap
.max_send_wr
, ch
->cm_id
);
2179 ret
= srpt_init_ch_qp(ch
, ch
->qp
);
2181 goto err_destroy_qp
;
2183 init_waitqueue_head(&ch
->wait_queue
);
2185 pr_debug("creating thread for session %s\n", ch
->sess_name
);
2187 ch
->thread
= kthread_run(srpt_compl_thread
, ch
, "ib_srpt_compl");
2188 if (IS_ERR(ch
->thread
)) {
2189 printk(KERN_ERR
"failed to create kernel thread %ld\n",
2190 PTR_ERR(ch
->thread
));
2192 goto err_destroy_qp
;
2200 ib_destroy_qp(ch
->qp
);
2202 ib_destroy_cq(ch
->cq
);
2206 static void srpt_destroy_ch_ib(struct srpt_rdma_ch
*ch
)
2209 kthread_stop(ch
->thread
);
2211 ib_destroy_qp(ch
->qp
);
2212 ib_destroy_cq(ch
->cq
);
2216 * __srpt_close_ch() - Close an RDMA channel by setting the QP error state.
2218 * Reset the QP and make sure all resources associated with the channel will
2219 * be deallocated at an appropriate time.
2221 * Note: The caller must hold ch->sport->sdev->spinlock.
2223 static void __srpt_close_ch(struct srpt_rdma_ch
*ch
)
2225 struct srpt_device
*sdev
;
2226 enum rdma_ch_state prev_state
;
2227 unsigned long flags
;
2229 sdev
= ch
->sport
->sdev
;
2231 spin_lock_irqsave(&ch
->spinlock
, flags
);
2232 prev_state
= ch
->state
;
2233 switch (prev_state
) {
2236 ch
->state
= CH_DISCONNECTING
;
2241 spin_unlock_irqrestore(&ch
->spinlock
, flags
);
2243 switch (prev_state
) {
2245 ib_send_cm_rej(ch
->cm_id
, IB_CM_REJ_NO_RESOURCES
, NULL
, 0,
2249 if (ib_send_cm_dreq(ch
->cm_id
, NULL
, 0) < 0)
2250 printk(KERN_ERR
"sending CM DREQ failed.\n");
2252 case CH_DISCONNECTING
:
2261 * srpt_close_ch() - Close an RDMA channel.
2263 static void srpt_close_ch(struct srpt_rdma_ch
*ch
)
2265 struct srpt_device
*sdev
;
2267 sdev
= ch
->sport
->sdev
;
2268 spin_lock_irq(&sdev
->spinlock
);
2269 __srpt_close_ch(ch
);
2270 spin_unlock_irq(&sdev
->spinlock
);
2274 * srpt_drain_channel() - Drain a channel by resetting the IB queue pair.
2275 * @cm_id: Pointer to the CM ID of the channel to be drained.
2277 * Note: Must be called from inside srpt_cm_handler to avoid a race between
2278 * accessing sdev->spinlock and the call to kfree(sdev) in srpt_remove_one()
2279 * (the caller of srpt_cm_handler holds the cm_id spinlock; srpt_remove_one()
2280 * waits until all target sessions for the associated IB device have been
2281 * unregistered and target session registration involves a call to
2282 * ib_destroy_cm_id(), which locks the cm_id spinlock and hence waits until
2283 * this function has finished).
2285 static void srpt_drain_channel(struct ib_cm_id
*cm_id
)
2287 struct srpt_device
*sdev
;
2288 struct srpt_rdma_ch
*ch
;
2290 bool do_reset
= false;
2292 WARN_ON_ONCE(irqs_disabled());
2294 sdev
= cm_id
->context
;
2296 spin_lock_irq(&sdev
->spinlock
);
2297 list_for_each_entry(ch
, &sdev
->rch_list
, list
) {
2298 if (ch
->cm_id
== cm_id
) {
2299 do_reset
= srpt_test_and_set_ch_state(ch
,
2300 CH_CONNECTING
, CH_DRAINING
) ||
2301 srpt_test_and_set_ch_state(ch
,
2302 CH_LIVE
, CH_DRAINING
) ||
2303 srpt_test_and_set_ch_state(ch
,
2304 CH_DISCONNECTING
, CH_DRAINING
);
2308 spin_unlock_irq(&sdev
->spinlock
);
2311 ret
= srpt_ch_qp_err(ch
);
2313 printk(KERN_ERR
"Setting queue pair in error state"
2314 " failed: %d\n", ret
);
2319 * srpt_find_channel() - Look up an RDMA channel.
2320 * @cm_id: Pointer to the CM ID of the channel to be looked up.
2322 * Return NULL if no matching RDMA channel has been found.
2324 static struct srpt_rdma_ch
*srpt_find_channel(struct srpt_device
*sdev
,
2325 struct ib_cm_id
*cm_id
)
2327 struct srpt_rdma_ch
*ch
;
2330 WARN_ON_ONCE(irqs_disabled());
2334 spin_lock_irq(&sdev
->spinlock
);
2335 list_for_each_entry(ch
, &sdev
->rch_list
, list
) {
2336 if (ch
->cm_id
== cm_id
) {
2341 spin_unlock_irq(&sdev
->spinlock
);
2343 return found
? ch
: NULL
;
2347 * srpt_release_channel() - Release channel resources.
2349 * Schedules the actual release because:
2350 * - Calling the ib_destroy_cm_id() call from inside an IB CM callback would
2351 * trigger a deadlock.
2352 * - It is not safe to call TCM transport_* functions from interrupt context.
2354 static void srpt_release_channel(struct srpt_rdma_ch
*ch
)
2356 schedule_work(&ch
->release_work
);
2359 static void srpt_release_channel_work(struct work_struct
*w
)
2361 struct srpt_rdma_ch
*ch
;
2362 struct srpt_device
*sdev
;
2364 ch
= container_of(w
, struct srpt_rdma_ch
, release_work
);
2365 pr_debug("ch = %p; ch->sess = %p; release_done = %p\n", ch
, ch
->sess
,
2368 sdev
= ch
->sport
->sdev
;
2371 transport_deregister_session_configfs(ch
->sess
);
2372 transport_deregister_session(ch
->sess
);
2375 srpt_destroy_ch_ib(ch
);
2377 srpt_free_ioctx_ring((struct srpt_ioctx
**)ch
->ioctx_ring
,
2378 ch
->sport
->sdev
, ch
->rq_size
,
2379 ch
->rsp_size
, DMA_TO_DEVICE
);
2381 spin_lock_irq(&sdev
->spinlock
);
2382 list_del(&ch
->list
);
2383 spin_unlock_irq(&sdev
->spinlock
);
2385 ib_destroy_cm_id(ch
->cm_id
);
2387 if (ch
->release_done
)
2388 complete(ch
->release_done
);
2390 wake_up(&sdev
->ch_releaseQ
);
2395 static struct srpt_node_acl
*__srpt_lookup_acl(struct srpt_port
*sport
,
2398 struct srpt_node_acl
*nacl
;
2400 list_for_each_entry(nacl
, &sport
->port_acl_list
, list
)
2401 if (memcmp(nacl
->i_port_id
, i_port_id
,
2402 sizeof(nacl
->i_port_id
)) == 0)
2408 static struct srpt_node_acl
*srpt_lookup_acl(struct srpt_port
*sport
,
2411 struct srpt_node_acl
*nacl
;
2413 spin_lock_irq(&sport
->port_acl_lock
);
2414 nacl
= __srpt_lookup_acl(sport
, i_port_id
);
2415 spin_unlock_irq(&sport
->port_acl_lock
);
2421 * srpt_cm_req_recv() - Process the event IB_CM_REQ_RECEIVED.
2423 * Ownership of the cm_id is transferred to the target session if this
2424 * functions returns zero. Otherwise the caller remains the owner of cm_id.
2426 static int srpt_cm_req_recv(struct ib_cm_id
*cm_id
,
2427 struct ib_cm_req_event_param
*param
,
2430 struct srpt_device
*sdev
= cm_id
->context
;
2431 struct srpt_port
*sport
= &sdev
->port
[param
->port
- 1];
2432 struct srp_login_req
*req
;
2433 struct srp_login_rsp
*rsp
;
2434 struct srp_login_rej
*rej
;
2435 struct ib_cm_rep_param
*rep_param
;
2436 struct srpt_rdma_ch
*ch
, *tmp_ch
;
2437 struct srpt_node_acl
*nacl
;
2442 WARN_ON_ONCE(irqs_disabled());
2444 if (WARN_ON(!sdev
|| !private_data
))
2447 req
= (struct srp_login_req
*)private_data
;
2449 it_iu_len
= be32_to_cpu(req
->req_it_iu_len
);
2451 printk(KERN_INFO
"Received SRP_LOGIN_REQ with i_port_id 0x%llx:0x%llx,"
2452 " t_port_id 0x%llx:0x%llx and it_iu_len %d on port %d"
2453 " (guid=0x%llx:0x%llx)\n",
2454 be64_to_cpu(*(__be64
*)&req
->initiator_port_id
[0]),
2455 be64_to_cpu(*(__be64
*)&req
->initiator_port_id
[8]),
2456 be64_to_cpu(*(__be64
*)&req
->target_port_id
[0]),
2457 be64_to_cpu(*(__be64
*)&req
->target_port_id
[8]),
2460 be64_to_cpu(*(__be64
*)&sdev
->port
[param
->port
- 1].gid
.raw
[0]),
2461 be64_to_cpu(*(__be64
*)&sdev
->port
[param
->port
- 1].gid
.raw
[8]));
2463 rsp
= kzalloc(sizeof *rsp
, GFP_KERNEL
);
2464 rej
= kzalloc(sizeof *rej
, GFP_KERNEL
);
2465 rep_param
= kzalloc(sizeof *rep_param
, GFP_KERNEL
);
2467 if (!rsp
|| !rej
|| !rep_param
) {
2472 if (it_iu_len
> srp_max_req_size
|| it_iu_len
< 64) {
2473 rej
->reason
= __constant_cpu_to_be32(
2474 SRP_LOGIN_REJ_REQ_IT_IU_LENGTH_TOO_LARGE
);
2476 printk(KERN_ERR
"rejected SRP_LOGIN_REQ because its"
2477 " length (%d bytes) is out of range (%d .. %d)\n",
2478 it_iu_len
, 64, srp_max_req_size
);
2482 if (!sport
->enabled
) {
2483 rej
->reason
= __constant_cpu_to_be32(
2484 SRP_LOGIN_REJ_INSUFFICIENT_RESOURCES
);
2486 printk(KERN_ERR
"rejected SRP_LOGIN_REQ because the target port"
2487 " has not yet been enabled\n");
2491 if ((req
->req_flags
& SRP_MTCH_ACTION
) == SRP_MULTICHAN_SINGLE
) {
2492 rsp
->rsp_flags
= SRP_LOGIN_RSP_MULTICHAN_NO_CHAN
;
2494 spin_lock_irq(&sdev
->spinlock
);
2496 list_for_each_entry_safe(ch
, tmp_ch
, &sdev
->rch_list
, list
) {
2497 if (!memcmp(ch
->i_port_id
, req
->initiator_port_id
, 16)
2498 && !memcmp(ch
->t_port_id
, req
->target_port_id
, 16)
2499 && param
->port
== ch
->sport
->port
2500 && param
->listen_id
== ch
->sport
->sdev
->cm_id
2502 enum rdma_ch_state ch_state
;
2504 ch_state
= srpt_get_ch_state(ch
);
2505 if (ch_state
!= CH_CONNECTING
2506 && ch_state
!= CH_LIVE
)
2509 /* found an existing channel */
2510 pr_debug("Found existing channel %s"
2511 " cm_id= %p state= %d\n",
2512 ch
->sess_name
, ch
->cm_id
, ch_state
);
2514 __srpt_close_ch(ch
);
2517 SRP_LOGIN_RSP_MULTICHAN_TERMINATED
;
2521 spin_unlock_irq(&sdev
->spinlock
);
2524 rsp
->rsp_flags
= SRP_LOGIN_RSP_MULTICHAN_MAINTAINED
;
2526 if (*(__be64
*)req
->target_port_id
!= cpu_to_be64(srpt_service_guid
)
2527 || *(__be64
*)(req
->target_port_id
+ 8) !=
2528 cpu_to_be64(srpt_service_guid
)) {
2529 rej
->reason
= __constant_cpu_to_be32(
2530 SRP_LOGIN_REJ_UNABLE_ASSOCIATE_CHANNEL
);
2532 printk(KERN_ERR
"rejected SRP_LOGIN_REQ because it"
2533 " has an invalid target port identifier.\n");
2537 ch
= kzalloc(sizeof *ch
, GFP_KERNEL
);
2539 rej
->reason
= __constant_cpu_to_be32(
2540 SRP_LOGIN_REJ_INSUFFICIENT_RESOURCES
);
2541 printk(KERN_ERR
"rejected SRP_LOGIN_REQ because no memory.\n");
2546 INIT_WORK(&ch
->release_work
, srpt_release_channel_work
);
2547 memcpy(ch
->i_port_id
, req
->initiator_port_id
, 16);
2548 memcpy(ch
->t_port_id
, req
->target_port_id
, 16);
2549 ch
->sport
= &sdev
->port
[param
->port
- 1];
2552 * Avoid QUEUE_FULL conditions by limiting the number of buffers used
2553 * for the SRP protocol to the command queue size.
2555 ch
->rq_size
= SRPT_RQ_SIZE
;
2556 spin_lock_init(&ch
->spinlock
);
2557 ch
->state
= CH_CONNECTING
;
2558 INIT_LIST_HEAD(&ch
->cmd_wait_list
);
2559 ch
->rsp_size
= ch
->sport
->port_attrib
.srp_max_rsp_size
;
2561 ch
->ioctx_ring
= (struct srpt_send_ioctx
**)
2562 srpt_alloc_ioctx_ring(ch
->sport
->sdev
, ch
->rq_size
,
2563 sizeof(*ch
->ioctx_ring
[0]),
2564 ch
->rsp_size
, DMA_TO_DEVICE
);
2565 if (!ch
->ioctx_ring
)
2568 INIT_LIST_HEAD(&ch
->free_list
);
2569 for (i
= 0; i
< ch
->rq_size
; i
++) {
2570 ch
->ioctx_ring
[i
]->ch
= ch
;
2571 list_add_tail(&ch
->ioctx_ring
[i
]->free_list
, &ch
->free_list
);
2574 ret
= srpt_create_ch_ib(ch
);
2576 rej
->reason
= __constant_cpu_to_be32(
2577 SRP_LOGIN_REJ_INSUFFICIENT_RESOURCES
);
2578 printk(KERN_ERR
"rejected SRP_LOGIN_REQ because creating"
2579 " a new RDMA channel failed.\n");
2583 ret
= srpt_ch_qp_rtr(ch
, ch
->qp
);
2585 rej
->reason
= __constant_cpu_to_be32(
2586 SRP_LOGIN_REJ_INSUFFICIENT_RESOURCES
);
2587 printk(KERN_ERR
"rejected SRP_LOGIN_REQ because enabling"
2588 " RTR failed (error code = %d)\n", ret
);
2592 * Use the initator port identifier as the session name.
2594 snprintf(ch
->sess_name
, sizeof(ch
->sess_name
), "0x%016llx%016llx",
2595 be64_to_cpu(*(__be64
*)ch
->i_port_id
),
2596 be64_to_cpu(*(__be64
*)(ch
->i_port_id
+ 8)));
2598 pr_debug("registering session %s\n", ch
->sess_name
);
2600 nacl
= srpt_lookup_acl(sport
, ch
->i_port_id
);
2602 printk(KERN_INFO
"Rejected login because no ACL has been"
2603 " configured yet for initiator %s.\n", ch
->sess_name
);
2604 rej
->reason
= __constant_cpu_to_be32(
2605 SRP_LOGIN_REJ_CHANNEL_LIMIT_REACHED
);
2609 ch
->sess
= transport_init_session();
2610 if (IS_ERR(ch
->sess
)) {
2611 rej
->reason
= __constant_cpu_to_be32(
2612 SRP_LOGIN_REJ_INSUFFICIENT_RESOURCES
);
2613 pr_debug("Failed to create session\n");
2614 goto deregister_session
;
2616 ch
->sess
->se_node_acl
= &nacl
->nacl
;
2617 transport_register_session(&sport
->port_tpg_1
, &nacl
->nacl
, ch
->sess
, ch
);
2619 pr_debug("Establish connection sess=%p name=%s cm_id=%p\n", ch
->sess
,
2620 ch
->sess_name
, ch
->cm_id
);
2622 /* create srp_login_response */
2623 rsp
->opcode
= SRP_LOGIN_RSP
;
2624 rsp
->tag
= req
->tag
;
2625 rsp
->max_it_iu_len
= req
->req_it_iu_len
;
2626 rsp
->max_ti_iu_len
= req
->req_it_iu_len
;
2627 ch
->max_ti_iu_len
= it_iu_len
;
2628 rsp
->buf_fmt
= __constant_cpu_to_be16(SRP_BUF_FORMAT_DIRECT
2629 | SRP_BUF_FORMAT_INDIRECT
);
2630 rsp
->req_lim_delta
= cpu_to_be32(ch
->rq_size
);
2631 atomic_set(&ch
->req_lim
, ch
->rq_size
);
2632 atomic_set(&ch
->req_lim_delta
, 0);
2634 /* create cm reply */
2635 rep_param
->qp_num
= ch
->qp
->qp_num
;
2636 rep_param
->private_data
= (void *)rsp
;
2637 rep_param
->private_data_len
= sizeof *rsp
;
2638 rep_param
->rnr_retry_count
= 7;
2639 rep_param
->flow_control
= 1;
2640 rep_param
->failover_accepted
= 0;
2642 rep_param
->responder_resources
= 4;
2643 rep_param
->initiator_depth
= 4;
2645 ret
= ib_send_cm_rep(cm_id
, rep_param
);
2647 printk(KERN_ERR
"sending SRP_LOGIN_REQ response failed"
2648 " (error code = %d)\n", ret
);
2649 goto release_channel
;
2652 spin_lock_irq(&sdev
->spinlock
);
2653 list_add_tail(&ch
->list
, &sdev
->rch_list
);
2654 spin_unlock_irq(&sdev
->spinlock
);
2659 srpt_set_ch_state(ch
, CH_RELEASING
);
2660 transport_deregister_session_configfs(ch
->sess
);
2663 transport_deregister_session(ch
->sess
);
2667 srpt_destroy_ch_ib(ch
);
2670 srpt_free_ioctx_ring((struct srpt_ioctx
**)ch
->ioctx_ring
,
2671 ch
->sport
->sdev
, ch
->rq_size
,
2672 ch
->rsp_size
, DMA_TO_DEVICE
);
2677 rej
->opcode
= SRP_LOGIN_REJ
;
2678 rej
->tag
= req
->tag
;
2679 rej
->buf_fmt
= __constant_cpu_to_be16(SRP_BUF_FORMAT_DIRECT
2680 | SRP_BUF_FORMAT_INDIRECT
);
2682 ib_send_cm_rej(cm_id
, IB_CM_REJ_CONSUMER_DEFINED
, NULL
, 0,
2683 (void *)rej
, sizeof *rej
);
2693 static void srpt_cm_rej_recv(struct ib_cm_id
*cm_id
)
2695 printk(KERN_INFO
"Received IB REJ for cm_id %p.\n", cm_id
);
2696 srpt_drain_channel(cm_id
);
2700 * srpt_cm_rtu_recv() - Process an IB_CM_RTU_RECEIVED or USER_ESTABLISHED event.
2702 * An IB_CM_RTU_RECEIVED message indicates that the connection is established
2703 * and that the recipient may begin transmitting (RTU = ready to use).
2705 static void srpt_cm_rtu_recv(struct ib_cm_id
*cm_id
)
2707 struct srpt_rdma_ch
*ch
;
2710 ch
= srpt_find_channel(cm_id
->context
, cm_id
);
2713 if (srpt_test_and_set_ch_state(ch
, CH_CONNECTING
, CH_LIVE
)) {
2714 struct srpt_recv_ioctx
*ioctx
, *ioctx_tmp
;
2716 ret
= srpt_ch_qp_rts(ch
, ch
->qp
);
2718 list_for_each_entry_safe(ioctx
, ioctx_tmp
, &ch
->cmd_wait_list
,
2720 list_del(&ioctx
->wait_list
);
2721 srpt_handle_new_iu(ch
, ioctx
, NULL
);
2728 static void srpt_cm_timewait_exit(struct ib_cm_id
*cm_id
)
2730 printk(KERN_INFO
"Received IB TimeWait exit for cm_id %p.\n", cm_id
);
2731 srpt_drain_channel(cm_id
);
2734 static void srpt_cm_rep_error(struct ib_cm_id
*cm_id
)
2736 printk(KERN_INFO
"Received IB REP error for cm_id %p.\n", cm_id
);
2737 srpt_drain_channel(cm_id
);
2741 * srpt_cm_dreq_recv() - Process reception of a DREQ message.
2743 static void srpt_cm_dreq_recv(struct ib_cm_id
*cm_id
)
2745 struct srpt_rdma_ch
*ch
;
2746 unsigned long flags
;
2747 bool send_drep
= false;
2749 ch
= srpt_find_channel(cm_id
->context
, cm_id
);
2752 pr_debug("cm_id= %p ch->state= %d\n", cm_id
, srpt_get_ch_state(ch
));
2754 spin_lock_irqsave(&ch
->spinlock
, flags
);
2755 switch (ch
->state
) {
2759 ch
->state
= CH_DISCONNECTING
;
2761 case CH_DISCONNECTING
:
2764 WARN(true, "unexpected channel state %d\n", ch
->state
);
2767 spin_unlock_irqrestore(&ch
->spinlock
, flags
);
2770 if (ib_send_cm_drep(ch
->cm_id
, NULL
, 0) < 0)
2771 printk(KERN_ERR
"Sending IB DREP failed.\n");
2772 printk(KERN_INFO
"Received DREQ and sent DREP for session %s.\n",
2778 * srpt_cm_drep_recv() - Process reception of a DREP message.
2780 static void srpt_cm_drep_recv(struct ib_cm_id
*cm_id
)
2782 printk(KERN_INFO
"Received InfiniBand DREP message for cm_id %p.\n",
2784 srpt_drain_channel(cm_id
);
2788 * srpt_cm_handler() - IB connection manager callback function.
2790 * A non-zero return value will cause the caller destroy the CM ID.
2792 * Note: srpt_cm_handler() must only return a non-zero value when transferring
2793 * ownership of the cm_id to a channel by srpt_cm_req_recv() failed. Returning
2794 * a non-zero value in any other case will trigger a race with the
2795 * ib_destroy_cm_id() call in srpt_release_channel().
2797 static int srpt_cm_handler(struct ib_cm_id
*cm_id
, struct ib_cm_event
*event
)
2802 switch (event
->event
) {
2803 case IB_CM_REQ_RECEIVED
:
2804 ret
= srpt_cm_req_recv(cm_id
, &event
->param
.req_rcvd
,
2805 event
->private_data
);
2807 case IB_CM_REJ_RECEIVED
:
2808 srpt_cm_rej_recv(cm_id
);
2810 case IB_CM_RTU_RECEIVED
:
2811 case IB_CM_USER_ESTABLISHED
:
2812 srpt_cm_rtu_recv(cm_id
);
2814 case IB_CM_DREQ_RECEIVED
:
2815 srpt_cm_dreq_recv(cm_id
);
2817 case IB_CM_DREP_RECEIVED
:
2818 srpt_cm_drep_recv(cm_id
);
2820 case IB_CM_TIMEWAIT_EXIT
:
2821 srpt_cm_timewait_exit(cm_id
);
2823 case IB_CM_REP_ERROR
:
2824 srpt_cm_rep_error(cm_id
);
2826 case IB_CM_DREQ_ERROR
:
2827 printk(KERN_INFO
"Received IB DREQ ERROR event.\n");
2829 case IB_CM_MRA_RECEIVED
:
2830 printk(KERN_INFO
"Received IB MRA event\n");
2833 printk(KERN_ERR
"received unrecognized IB CM event %d\n",
2842 * srpt_perform_rdmas() - Perform IB RDMA.
2844 * Returns zero upon success or a negative number upon failure.
2846 static int srpt_perform_rdmas(struct srpt_rdma_ch
*ch
,
2847 struct srpt_send_ioctx
*ioctx
)
2849 struct ib_send_wr wr
;
2850 struct ib_send_wr
*bad_wr
;
2851 struct rdma_iu
*riu
;
2855 enum dma_data_direction dir
;
2856 const int n_rdma
= ioctx
->n_rdma
;
2858 dir
= ioctx
->cmd
.data_direction
;
2859 if (dir
== DMA_TO_DEVICE
) {
2862 sq_wr_avail
= atomic_sub_return(n_rdma
, &ch
->sq_wr_avail
);
2863 if (sq_wr_avail
< 0) {
2864 printk(KERN_WARNING
"IB send queue full (needed %d)\n",
2870 ioctx
->rdma_aborted
= false;
2872 riu
= ioctx
->rdma_ius
;
2873 memset(&wr
, 0, sizeof wr
);
2875 for (i
= 0; i
< n_rdma
; ++i
, ++riu
) {
2876 if (dir
== DMA_FROM_DEVICE
) {
2877 wr
.opcode
= IB_WR_RDMA_WRITE
;
2878 wr
.wr_id
= encode_wr_id(i
== n_rdma
- 1 ?
2879 SRPT_RDMA_WRITE_LAST
:
2881 ioctx
->ioctx
.index
);
2883 wr
.opcode
= IB_WR_RDMA_READ
;
2884 wr
.wr_id
= encode_wr_id(i
== n_rdma
- 1 ?
2885 SRPT_RDMA_READ_LAST
:
2887 ioctx
->ioctx
.index
);
2890 wr
.wr
.rdma
.remote_addr
= riu
->raddr
;
2891 wr
.wr
.rdma
.rkey
= riu
->rkey
;
2892 wr
.num_sge
= riu
->sge_cnt
;
2893 wr
.sg_list
= riu
->sge
;
2895 /* only get completion event for the last rdma write */
2896 if (i
== (n_rdma
- 1) && dir
== DMA_TO_DEVICE
)
2897 wr
.send_flags
= IB_SEND_SIGNALED
;
2899 ret
= ib_post_send(ch
->qp
, &wr
, &bad_wr
);
2905 printk(KERN_ERR
"%s[%d]: ib_post_send() returned %d for %d/%d",
2906 __func__
, __LINE__
, ret
, i
, n_rdma
);
2909 wr
.wr_id
= encode_wr_id(SRPT_RDMA_ABORT
, ioctx
->ioctx
.index
);
2910 wr
.send_flags
= IB_SEND_SIGNALED
;
2911 while (ch
->state
== CH_LIVE
&&
2912 ib_post_send(ch
->qp
, &wr
, &bad_wr
) != 0) {
2913 printk(KERN_INFO
"Trying to abort failed RDMA transfer [%d]",
2914 ioctx
->ioctx
.index
);
2917 while (ch
->state
!= CH_RELEASING
&& !ioctx
->rdma_aborted
) {
2918 printk(KERN_INFO
"Waiting until RDMA abort finished [%d]",
2919 ioctx
->ioctx
.index
);
2924 if (unlikely(dir
== DMA_TO_DEVICE
&& ret
< 0))
2925 atomic_add(n_rdma
, &ch
->sq_wr_avail
);
2930 * srpt_xfer_data() - Start data transfer from initiator to target.
2932 static int srpt_xfer_data(struct srpt_rdma_ch
*ch
,
2933 struct srpt_send_ioctx
*ioctx
)
2937 ret
= srpt_map_sg_to_ib_sge(ch
, ioctx
);
2939 printk(KERN_ERR
"%s[%d] ret=%d\n", __func__
, __LINE__
, ret
);
2943 ret
= srpt_perform_rdmas(ch
, ioctx
);
2945 if (ret
== -EAGAIN
|| ret
== -ENOMEM
)
2946 printk(KERN_INFO
"%s[%d] queue full -- ret=%d\n",
2947 __func__
, __LINE__
, ret
);
2949 printk(KERN_ERR
"%s[%d] fatal error -- ret=%d\n",
2950 __func__
, __LINE__
, ret
);
2957 srpt_unmap_sg_to_ib_sge(ch
, ioctx
);
2961 static int srpt_write_pending_status(struct se_cmd
*se_cmd
)
2963 struct srpt_send_ioctx
*ioctx
;
2965 ioctx
= container_of(se_cmd
, struct srpt_send_ioctx
, cmd
);
2966 return srpt_get_cmd_state(ioctx
) == SRPT_STATE_NEED_DATA
;
2970 * srpt_write_pending() - Start data transfer from initiator to target (write).
2972 static int srpt_write_pending(struct se_cmd
*se_cmd
)
2974 struct srpt_rdma_ch
*ch
;
2975 struct srpt_send_ioctx
*ioctx
;
2976 enum srpt_command_state new_state
;
2977 enum rdma_ch_state ch_state
;
2980 ioctx
= container_of(se_cmd
, struct srpt_send_ioctx
, cmd
);
2982 new_state
= srpt_set_cmd_state(ioctx
, SRPT_STATE_NEED_DATA
);
2983 WARN_ON(new_state
== SRPT_STATE_DONE
);
2988 ch_state
= srpt_get_ch_state(ch
);
2991 WARN(true, "unexpected channel state %d\n", ch_state
);
2996 case CH_DISCONNECTING
:
2999 pr_debug("cmd with tag %lld: channel disconnecting\n",
3001 srpt_set_cmd_state(ioctx
, SRPT_STATE_DATA_IN
);
3005 ret
= srpt_xfer_data(ch
, ioctx
);
3011 static u8
tcm_to_srp_tsk_mgmt_status(const int tcm_mgmt_status
)
3013 switch (tcm_mgmt_status
) {
3014 case TMR_FUNCTION_COMPLETE
:
3015 return SRP_TSK_MGMT_SUCCESS
;
3016 case TMR_FUNCTION_REJECTED
:
3017 return SRP_TSK_MGMT_FUNC_NOT_SUPP
;
3019 return SRP_TSK_MGMT_FAILED
;
3023 * srpt_queue_response() - Transmits the response to a SCSI command.
3025 * Callback function called by the TCM core. Must not block since it can be
3026 * invoked on the context of the IB completion handler.
3028 static int srpt_queue_response(struct se_cmd
*cmd
)
3030 struct srpt_rdma_ch
*ch
;
3031 struct srpt_send_ioctx
*ioctx
;
3032 enum srpt_command_state state
;
3033 unsigned long flags
;
3035 enum dma_data_direction dir
;
3041 ioctx
= container_of(cmd
, struct srpt_send_ioctx
, cmd
);
3045 spin_lock_irqsave(&ioctx
->spinlock
, flags
);
3046 state
= ioctx
->state
;
3048 case SRPT_STATE_NEW
:
3049 case SRPT_STATE_DATA_IN
:
3050 ioctx
->state
= SRPT_STATE_CMD_RSP_SENT
;
3052 case SRPT_STATE_MGMT
:
3053 ioctx
->state
= SRPT_STATE_MGMT_RSP_SENT
;
3056 WARN(true, "ch %p; cmd %d: unexpected command state %d\n",
3057 ch
, ioctx
->ioctx
.index
, ioctx
->state
);
3060 spin_unlock_irqrestore(&ioctx
->spinlock
, flags
);
3062 if (unlikely(transport_check_aborted_status(&ioctx
->cmd
, false)
3063 || WARN_ON_ONCE(state
== SRPT_STATE_CMD_RSP_SENT
))) {
3064 atomic_inc(&ch
->req_lim_delta
);
3065 srpt_abort_cmd(ioctx
);
3069 dir
= ioctx
->cmd
.data_direction
;
3071 /* For read commands, transfer the data to the initiator. */
3072 if (dir
== DMA_FROM_DEVICE
&& ioctx
->cmd
.data_length
&&
3073 !ioctx
->queue_status_only
) {
3074 ret
= srpt_xfer_data(ch
, ioctx
);
3076 printk(KERN_ERR
"xfer_data failed for tag %llu\n",
3082 if (state
!= SRPT_STATE_MGMT
)
3083 resp_len
= srpt_build_cmd_rsp(ch
, ioctx
, ioctx
->tag
,
3087 = tcm_to_srp_tsk_mgmt_status(cmd
->se_tmr_req
->response
);
3088 resp_len
= srpt_build_tskmgmt_rsp(ch
, ioctx
, srp_tm_status
,
3091 ret
= srpt_post_send(ch
, ioctx
, resp_len
);
3093 printk(KERN_ERR
"sending cmd response failed for tag %llu\n",
3095 srpt_unmap_sg_to_ib_sge(ch
, ioctx
);
3096 srpt_set_cmd_state(ioctx
, SRPT_STATE_DONE
);
3097 kref_put(&ioctx
->kref
, srpt_put_send_ioctx_kref
);
3104 static int srpt_queue_status(struct se_cmd
*cmd
)
3106 struct srpt_send_ioctx
*ioctx
;
3108 ioctx
= container_of(cmd
, struct srpt_send_ioctx
, cmd
);
3109 BUG_ON(ioctx
->sense_data
!= cmd
->sense_buffer
);
3110 if (cmd
->se_cmd_flags
&
3111 (SCF_TRANSPORT_TASK_SENSE
| SCF_EMULATED_TASK_SENSE
))
3112 WARN_ON(cmd
->scsi_status
!= SAM_STAT_CHECK_CONDITION
);
3113 ioctx
->queue_status_only
= true;
3114 return srpt_queue_response(cmd
);
3117 static void srpt_refresh_port_work(struct work_struct
*work
)
3119 struct srpt_port
*sport
= container_of(work
, struct srpt_port
, work
);
3121 srpt_refresh_port(sport
);
3124 static int srpt_ch_list_empty(struct srpt_device
*sdev
)
3128 spin_lock_irq(&sdev
->spinlock
);
3129 res
= list_empty(&sdev
->rch_list
);
3130 spin_unlock_irq(&sdev
->spinlock
);
3136 * srpt_release_sdev() - Free the channel resources associated with a target.
3138 static int srpt_release_sdev(struct srpt_device
*sdev
)
3140 struct srpt_rdma_ch
*ch
, *tmp_ch
;
3143 WARN_ON_ONCE(irqs_disabled());
3147 spin_lock_irq(&sdev
->spinlock
);
3148 list_for_each_entry_safe(ch
, tmp_ch
, &sdev
->rch_list
, list
)
3149 __srpt_close_ch(ch
);
3150 spin_unlock_irq(&sdev
->spinlock
);
3152 res
= wait_event_interruptible(sdev
->ch_releaseQ
,
3153 srpt_ch_list_empty(sdev
));
3155 printk(KERN_ERR
"%s: interrupted.\n", __func__
);
3160 static struct srpt_port
*__srpt_lookup_port(const char *name
)
3162 struct ib_device
*dev
;
3163 struct srpt_device
*sdev
;
3164 struct srpt_port
*sport
;
3167 list_for_each_entry(sdev
, &srpt_dev_list
, list
) {
3172 for (i
= 0; i
< dev
->phys_port_cnt
; i
++) {
3173 sport
= &sdev
->port
[i
];
3175 if (!strcmp(sport
->port_guid
, name
))
3183 static struct srpt_port
*srpt_lookup_port(const char *name
)
3185 struct srpt_port
*sport
;
3187 spin_lock(&srpt_dev_lock
);
3188 sport
= __srpt_lookup_port(name
);
3189 spin_unlock(&srpt_dev_lock
);
3195 * srpt_add_one() - Infiniband device addition callback function.
3197 static void srpt_add_one(struct ib_device
*device
)
3199 struct srpt_device
*sdev
;
3200 struct srpt_port
*sport
;
3201 struct ib_srq_init_attr srq_attr
;
3204 pr_debug("device = %p, device->dma_ops = %p\n", device
,
3207 sdev
= kzalloc(sizeof *sdev
, GFP_KERNEL
);
3211 sdev
->device
= device
;
3212 INIT_LIST_HEAD(&sdev
->rch_list
);
3213 init_waitqueue_head(&sdev
->ch_releaseQ
);
3214 spin_lock_init(&sdev
->spinlock
);
3216 if (ib_query_device(device
, &sdev
->dev_attr
))
3219 sdev
->pd
= ib_alloc_pd(device
);
3220 if (IS_ERR(sdev
->pd
))
3223 sdev
->mr
= ib_get_dma_mr(sdev
->pd
, IB_ACCESS_LOCAL_WRITE
);
3224 if (IS_ERR(sdev
->mr
))
3227 sdev
->srq_size
= min(srpt_srq_size
, sdev
->dev_attr
.max_srq_wr
);
3229 srq_attr
.event_handler
= srpt_srq_event
;
3230 srq_attr
.srq_context
= (void *)sdev
;
3231 srq_attr
.attr
.max_wr
= sdev
->srq_size
;
3232 srq_attr
.attr
.max_sge
= 1;
3233 srq_attr
.attr
.srq_limit
= 0;
3235 sdev
->srq
= ib_create_srq(sdev
->pd
, &srq_attr
);
3236 if (IS_ERR(sdev
->srq
))
3239 pr_debug("%s: create SRQ #wr= %d max_allow=%d dev= %s\n",
3240 __func__
, sdev
->srq_size
, sdev
->dev_attr
.max_srq_wr
,
3243 if (!srpt_service_guid
)
3244 srpt_service_guid
= be64_to_cpu(device
->node_guid
);
3246 sdev
->cm_id
= ib_create_cm_id(device
, srpt_cm_handler
, sdev
);
3247 if (IS_ERR(sdev
->cm_id
))
3250 /* print out target login information */
3251 pr_debug("Target login info: id_ext=%016llx,ioc_guid=%016llx,"
3252 "pkey=ffff,service_id=%016llx\n", srpt_service_guid
,
3253 srpt_service_guid
, srpt_service_guid
);
3256 * We do not have a consistent service_id (ie. also id_ext of target_id)
3257 * to identify this target. We currently use the guid of the first HCA
3258 * in the system as service_id; therefore, the target_id will change
3259 * if this HCA is gone bad and replaced by different HCA
3261 if (ib_cm_listen(sdev
->cm_id
, cpu_to_be64(srpt_service_guid
), 0, NULL
))
3264 INIT_IB_EVENT_HANDLER(&sdev
->event_handler
, sdev
->device
,
3265 srpt_event_handler
);
3266 if (ib_register_event_handler(&sdev
->event_handler
))
3269 sdev
->ioctx_ring
= (struct srpt_recv_ioctx
**)
3270 srpt_alloc_ioctx_ring(sdev
, sdev
->srq_size
,
3271 sizeof(*sdev
->ioctx_ring
[0]),
3272 srp_max_req_size
, DMA_FROM_DEVICE
);
3273 if (!sdev
->ioctx_ring
)
3276 for (i
= 0; i
< sdev
->srq_size
; ++i
)
3277 srpt_post_recv(sdev
, sdev
->ioctx_ring
[i
]);
3279 WARN_ON(sdev
->device
->phys_port_cnt
> ARRAY_SIZE(sdev
->port
));
3281 for (i
= 1; i
<= sdev
->device
->phys_port_cnt
; i
++) {
3282 sport
= &sdev
->port
[i
- 1];
3285 sport
->port_attrib
.srp_max_rdma_size
= DEFAULT_MAX_RDMA_SIZE
;
3286 sport
->port_attrib
.srp_max_rsp_size
= DEFAULT_MAX_RSP_SIZE
;
3287 sport
->port_attrib
.srp_sq_size
= DEF_SRPT_SQ_SIZE
;
3288 INIT_WORK(&sport
->work
, srpt_refresh_port_work
);
3289 INIT_LIST_HEAD(&sport
->port_acl_list
);
3290 spin_lock_init(&sport
->port_acl_lock
);
3292 if (srpt_refresh_port(sport
)) {
3293 printk(KERN_ERR
"MAD registration failed for %s-%d.\n",
3294 srpt_sdev_name(sdev
), i
);
3297 snprintf(sport
->port_guid
, sizeof(sport
->port_guid
),
3299 be64_to_cpu(sport
->gid
.global
.subnet_prefix
),
3300 be64_to_cpu(sport
->gid
.global
.interface_id
));
3303 spin_lock(&srpt_dev_lock
);
3304 list_add_tail(&sdev
->list
, &srpt_dev_list
);
3305 spin_unlock(&srpt_dev_lock
);
3308 ib_set_client_data(device
, &srpt_client
, sdev
);
3309 pr_debug("added %s.\n", device
->name
);
3313 srpt_free_ioctx_ring((struct srpt_ioctx
**)sdev
->ioctx_ring
, sdev
,
3314 sdev
->srq_size
, srp_max_req_size
,
3317 ib_unregister_event_handler(&sdev
->event_handler
);
3319 ib_destroy_cm_id(sdev
->cm_id
);
3321 ib_destroy_srq(sdev
->srq
);
3323 ib_dereg_mr(sdev
->mr
);
3325 ib_dealloc_pd(sdev
->pd
);
3330 printk(KERN_INFO
"%s(%s) failed.\n", __func__
, device
->name
);
3335 * srpt_remove_one() - InfiniBand device removal callback function.
3337 static void srpt_remove_one(struct ib_device
*device
)
3339 struct srpt_device
*sdev
;
3342 sdev
= ib_get_client_data(device
, &srpt_client
);
3344 printk(KERN_INFO
"%s(%s): nothing to do.\n", __func__
,
3349 srpt_unregister_mad_agent(sdev
);
3351 ib_unregister_event_handler(&sdev
->event_handler
);
3353 /* Cancel any work queued by the just unregistered IB event handler. */
3354 for (i
= 0; i
< sdev
->device
->phys_port_cnt
; i
++)
3355 cancel_work_sync(&sdev
->port
[i
].work
);
3357 ib_destroy_cm_id(sdev
->cm_id
);
3360 * Unregistering a target must happen after destroying sdev->cm_id
3361 * such that no new SRP_LOGIN_REQ information units can arrive while
3362 * destroying the target.
3364 spin_lock(&srpt_dev_lock
);
3365 list_del(&sdev
->list
);
3366 spin_unlock(&srpt_dev_lock
);
3367 srpt_release_sdev(sdev
);
3369 ib_destroy_srq(sdev
->srq
);
3370 ib_dereg_mr(sdev
->mr
);
3371 ib_dealloc_pd(sdev
->pd
);
3373 srpt_free_ioctx_ring((struct srpt_ioctx
**)sdev
->ioctx_ring
, sdev
,
3374 sdev
->srq_size
, srp_max_req_size
, DMA_FROM_DEVICE
);
3375 sdev
->ioctx_ring
= NULL
;
3379 static struct ib_client srpt_client
= {
3381 .add
= srpt_add_one
,
3382 .remove
= srpt_remove_one
3385 static int srpt_check_true(struct se_portal_group
*se_tpg
)
3390 static int srpt_check_false(struct se_portal_group
*se_tpg
)
3395 static char *srpt_get_fabric_name(void)
3400 static u8
srpt_get_fabric_proto_ident(struct se_portal_group
*se_tpg
)
3402 return SCSI_TRANSPORTID_PROTOCOLID_SRP
;
3405 static char *srpt_get_fabric_wwn(struct se_portal_group
*tpg
)
3407 struct srpt_port
*sport
= container_of(tpg
, struct srpt_port
, port_tpg_1
);
3409 return sport
->port_guid
;
3412 static u16
srpt_get_tag(struct se_portal_group
*tpg
)
3417 static u32
srpt_get_default_depth(struct se_portal_group
*se_tpg
)
3422 static u32
srpt_get_pr_transport_id(struct se_portal_group
*se_tpg
,
3423 struct se_node_acl
*se_nacl
,
3424 struct t10_pr_registration
*pr_reg
,
3425 int *format_code
, unsigned char *buf
)
3427 struct srpt_node_acl
*nacl
;
3428 struct spc_rdma_transport_id
*tr_id
;
3430 nacl
= container_of(se_nacl
, struct srpt_node_acl
, nacl
);
3431 tr_id
= (void *)buf
;
3432 tr_id
->protocol_identifier
= SCSI_TRANSPORTID_PROTOCOLID_SRP
;
3433 memcpy(tr_id
->i_port_id
, nacl
->i_port_id
, sizeof(tr_id
->i_port_id
));
3434 return sizeof(*tr_id
);
3437 static u32
srpt_get_pr_transport_id_len(struct se_portal_group
*se_tpg
,
3438 struct se_node_acl
*se_nacl
,
3439 struct t10_pr_registration
*pr_reg
,
3443 return sizeof(struct spc_rdma_transport_id
);
3446 static char *srpt_parse_pr_out_transport_id(struct se_portal_group
*se_tpg
,
3447 const char *buf
, u32
*out_tid_len
,
3448 char **port_nexus_ptr
)
3450 struct spc_rdma_transport_id
*tr_id
;
3452 *port_nexus_ptr
= NULL
;
3453 *out_tid_len
= sizeof(struct spc_rdma_transport_id
);
3454 tr_id
= (void *)buf
;
3455 return (char *)tr_id
->i_port_id
;
3458 static struct se_node_acl
*srpt_alloc_fabric_acl(struct se_portal_group
*se_tpg
)
3460 struct srpt_node_acl
*nacl
;
3462 nacl
= kzalloc(sizeof(struct srpt_node_acl
), GFP_KERNEL
);
3464 printk(KERN_ERR
"Unable to allocate struct srpt_node_acl\n");
3471 static void srpt_release_fabric_acl(struct se_portal_group
*se_tpg
,
3472 struct se_node_acl
*se_nacl
)
3474 struct srpt_node_acl
*nacl
;
3476 nacl
= container_of(se_nacl
, struct srpt_node_acl
, nacl
);
3480 static u32
srpt_tpg_get_inst_index(struct se_portal_group
*se_tpg
)
3485 static void srpt_release_cmd(struct se_cmd
*se_cmd
)
3490 * srpt_shutdown_session() - Whether or not a session may be shut down.
3492 static int srpt_shutdown_session(struct se_session
*se_sess
)
3498 * srpt_close_session() - Forcibly close a session.
3500 * Callback function invoked by the TCM core to clean up sessions associated
3501 * with a node ACL when the user invokes
3502 * rmdir /sys/kernel/config/target/$driver/$port/$tpg/acls/$i_port_id
3504 static void srpt_close_session(struct se_session
*se_sess
)
3506 DECLARE_COMPLETION_ONSTACK(release_done
);
3507 struct srpt_rdma_ch
*ch
;
3508 struct srpt_device
*sdev
;
3511 ch
= se_sess
->fabric_sess_ptr
;
3512 WARN_ON(ch
->sess
!= se_sess
);
3514 pr_debug("ch %p state %d\n", ch
, srpt_get_ch_state(ch
));
3516 sdev
= ch
->sport
->sdev
;
3517 spin_lock_irq(&sdev
->spinlock
);
3518 BUG_ON(ch
->release_done
);
3519 ch
->release_done
= &release_done
;
3520 __srpt_close_ch(ch
);
3521 spin_unlock_irq(&sdev
->spinlock
);
3523 res
= wait_for_completion_timeout(&release_done
, 60 * HZ
);
3528 * srpt_sess_get_index() - Return the value of scsiAttIntrPortIndex (SCSI-MIB).
3530 * A quote from RFC 4455 (SCSI-MIB) about this MIB object:
3531 * This object represents an arbitrary integer used to uniquely identify a
3532 * particular attached remote initiator port to a particular SCSI target port
3533 * within a particular SCSI target device within a particular SCSI instance.
3535 static u32
srpt_sess_get_index(struct se_session
*se_sess
)
3540 static void srpt_set_default_node_attrs(struct se_node_acl
*nacl
)
3544 static u32
srpt_get_task_tag(struct se_cmd
*se_cmd
)
3546 struct srpt_send_ioctx
*ioctx
;
3548 ioctx
= container_of(se_cmd
, struct srpt_send_ioctx
, cmd
);
3552 /* Note: only used from inside debug printk's by the TCM core. */
3553 static int srpt_get_tcm_cmd_state(struct se_cmd
*se_cmd
)
3555 struct srpt_send_ioctx
*ioctx
;
3557 ioctx
= container_of(se_cmd
, struct srpt_send_ioctx
, cmd
);
3558 return srpt_get_cmd_state(ioctx
);
3561 static u16
srpt_set_fabric_sense_len(struct se_cmd
*cmd
, u32 sense_length
)
3566 static u16
srpt_get_fabric_sense_len(void)
3572 * srpt_parse_i_port_id() - Parse an initiator port ID.
3573 * @name: ASCII representation of a 128-bit initiator port ID.
3574 * @i_port_id: Binary 128-bit port ID.
3576 static int srpt_parse_i_port_id(u8 i_port_id
[16], const char *name
)
3579 unsigned len
, count
, leading_zero_bytes
;
3583 if (strnicmp(p
, "0x", 2) == 0)
3589 count
= min(len
/ 2, 16U);
3590 leading_zero_bytes
= 16 - count
;
3591 memset(i_port_id
, 0, leading_zero_bytes
);
3592 rc
= hex2bin(i_port_id
+ leading_zero_bytes
, p
, count
);
3594 pr_debug("hex2bin failed for srpt_parse_i_port_id: %d\n", rc
);
3601 * configfs callback function invoked for
3602 * mkdir /sys/kernel/config/target/$driver/$port/$tpg/acls/$i_port_id
3604 static struct se_node_acl
*srpt_make_nodeacl(struct se_portal_group
*tpg
,
3605 struct config_group
*group
,
3608 struct srpt_port
*sport
= container_of(tpg
, struct srpt_port
, port_tpg_1
);
3609 struct se_node_acl
*se_nacl
, *se_nacl_new
;
3610 struct srpt_node_acl
*nacl
;
3612 u32 nexus_depth
= 1;
3615 if (srpt_parse_i_port_id(i_port_id
, name
) < 0) {
3616 printk(KERN_ERR
"invalid initiator port ID %s\n", name
);
3621 se_nacl_new
= srpt_alloc_fabric_acl(tpg
);
3627 * nacl_new may be released by core_tpg_add_initiator_node_acl()
3628 * when converting a node ACL from demo mode to explict
3630 se_nacl
= core_tpg_add_initiator_node_acl(tpg
, se_nacl_new
, name
,
3632 if (IS_ERR(se_nacl
)) {
3633 ret
= PTR_ERR(se_nacl
);
3636 /* Locate our struct srpt_node_acl and set sdev and i_port_id. */
3637 nacl
= container_of(se_nacl
, struct srpt_node_acl
, nacl
);
3638 memcpy(&nacl
->i_port_id
[0], &i_port_id
[0], 16);
3639 nacl
->sport
= sport
;
3641 spin_lock_irq(&sport
->port_acl_lock
);
3642 list_add_tail(&nacl
->list
, &sport
->port_acl_list
);
3643 spin_unlock_irq(&sport
->port_acl_lock
);
3647 return ERR_PTR(ret
);
3651 * configfs callback function invoked for
3652 * rmdir /sys/kernel/config/target/$driver/$port/$tpg/acls/$i_port_id
3654 static void srpt_drop_nodeacl(struct se_node_acl
*se_nacl
)
3656 struct srpt_node_acl
*nacl
;
3657 struct srpt_device
*sdev
;
3658 struct srpt_port
*sport
;
3660 nacl
= container_of(se_nacl
, struct srpt_node_acl
, nacl
);
3661 sport
= nacl
->sport
;
3663 spin_lock_irq(&sport
->port_acl_lock
);
3664 list_del(&nacl
->list
);
3665 spin_unlock_irq(&sport
->port_acl_lock
);
3666 core_tpg_del_initiator_node_acl(&sport
->port_tpg_1
, se_nacl
, 1);
3667 srpt_release_fabric_acl(NULL
, se_nacl
);
3670 static ssize_t
srpt_tpg_attrib_show_srp_max_rdma_size(
3671 struct se_portal_group
*se_tpg
,
3674 struct srpt_port
*sport
= container_of(se_tpg
, struct srpt_port
, port_tpg_1
);
3676 return sprintf(page
, "%u\n", sport
->port_attrib
.srp_max_rdma_size
);
3679 static ssize_t
srpt_tpg_attrib_store_srp_max_rdma_size(
3680 struct se_portal_group
*se_tpg
,
3684 struct srpt_port
*sport
= container_of(se_tpg
, struct srpt_port
, port_tpg_1
);
3688 ret
= strict_strtoul(page
, 0, &val
);
3690 pr_err("strict_strtoul() failed with ret: %d\n", ret
);
3693 if (val
> MAX_SRPT_RDMA_SIZE
) {
3694 pr_err("val: %lu exceeds MAX_SRPT_RDMA_SIZE: %d\n", val
,
3695 MAX_SRPT_RDMA_SIZE
);
3698 if (val
< DEFAULT_MAX_RDMA_SIZE
) {
3699 pr_err("val: %lu smaller than DEFAULT_MAX_RDMA_SIZE: %d\n",
3700 val
, DEFAULT_MAX_RDMA_SIZE
);
3703 sport
->port_attrib
.srp_max_rdma_size
= val
;
3708 TF_TPG_ATTRIB_ATTR(srpt
, srp_max_rdma_size
, S_IRUGO
| S_IWUSR
);
3710 static ssize_t
srpt_tpg_attrib_show_srp_max_rsp_size(
3711 struct se_portal_group
*se_tpg
,
3714 struct srpt_port
*sport
= container_of(se_tpg
, struct srpt_port
, port_tpg_1
);
3716 return sprintf(page
, "%u\n", sport
->port_attrib
.srp_max_rsp_size
);
3719 static ssize_t
srpt_tpg_attrib_store_srp_max_rsp_size(
3720 struct se_portal_group
*se_tpg
,
3724 struct srpt_port
*sport
= container_of(se_tpg
, struct srpt_port
, port_tpg_1
);
3728 ret
= strict_strtoul(page
, 0, &val
);
3730 pr_err("strict_strtoul() failed with ret: %d\n", ret
);
3733 if (val
> MAX_SRPT_RSP_SIZE
) {
3734 pr_err("val: %lu exceeds MAX_SRPT_RSP_SIZE: %d\n", val
,
3738 if (val
< MIN_MAX_RSP_SIZE
) {
3739 pr_err("val: %lu smaller than MIN_MAX_RSP_SIZE: %d\n", val
,
3743 sport
->port_attrib
.srp_max_rsp_size
= val
;
3748 TF_TPG_ATTRIB_ATTR(srpt
, srp_max_rsp_size
, S_IRUGO
| S_IWUSR
);
3750 static ssize_t
srpt_tpg_attrib_show_srp_sq_size(
3751 struct se_portal_group
*se_tpg
,
3754 struct srpt_port
*sport
= container_of(se_tpg
, struct srpt_port
, port_tpg_1
);
3756 return sprintf(page
, "%u\n", sport
->port_attrib
.srp_sq_size
);
3759 static ssize_t
srpt_tpg_attrib_store_srp_sq_size(
3760 struct se_portal_group
*se_tpg
,
3764 struct srpt_port
*sport
= container_of(se_tpg
, struct srpt_port
, port_tpg_1
);
3768 ret
= strict_strtoul(page
, 0, &val
);
3770 pr_err("strict_strtoul() failed with ret: %d\n", ret
);
3773 if (val
> MAX_SRPT_SRQ_SIZE
) {
3774 pr_err("val: %lu exceeds MAX_SRPT_SRQ_SIZE: %d\n", val
,
3778 if (val
< MIN_SRPT_SRQ_SIZE
) {
3779 pr_err("val: %lu smaller than MIN_SRPT_SRQ_SIZE: %d\n", val
,
3783 sport
->port_attrib
.srp_sq_size
= val
;
3788 TF_TPG_ATTRIB_ATTR(srpt
, srp_sq_size
, S_IRUGO
| S_IWUSR
);
3790 static struct configfs_attribute
*srpt_tpg_attrib_attrs
[] = {
3791 &srpt_tpg_attrib_srp_max_rdma_size
.attr
,
3792 &srpt_tpg_attrib_srp_max_rsp_size
.attr
,
3793 &srpt_tpg_attrib_srp_sq_size
.attr
,
3797 static ssize_t
srpt_tpg_show_enable(
3798 struct se_portal_group
*se_tpg
,
3801 struct srpt_port
*sport
= container_of(se_tpg
, struct srpt_port
, port_tpg_1
);
3803 return snprintf(page
, PAGE_SIZE
, "%d\n", (sport
->enabled
) ? 1: 0);
3806 static ssize_t
srpt_tpg_store_enable(
3807 struct se_portal_group
*se_tpg
,
3811 struct srpt_port
*sport
= container_of(se_tpg
, struct srpt_port
, port_tpg_1
);
3815 ret
= strict_strtoul(page
, 0, &tmp
);
3817 printk(KERN_ERR
"Unable to extract srpt_tpg_store_enable\n");
3821 if ((tmp
!= 0) && (tmp
!= 1)) {
3822 printk(KERN_ERR
"Illegal value for srpt_tpg_store_enable: %lu\n", tmp
);
3826 sport
->enabled
= true;
3828 sport
->enabled
= false;
3833 TF_TPG_BASE_ATTR(srpt
, enable
, S_IRUGO
| S_IWUSR
);
3835 static struct configfs_attribute
*srpt_tpg_attrs
[] = {
3836 &srpt_tpg_enable
.attr
,
3841 * configfs callback invoked for
3842 * mkdir /sys/kernel/config/target/$driver/$port/$tpg
3844 static struct se_portal_group
*srpt_make_tpg(struct se_wwn
*wwn
,
3845 struct config_group
*group
,
3848 struct srpt_port
*sport
= container_of(wwn
, struct srpt_port
, port_wwn
);
3851 /* Initialize sport->port_wwn and sport->port_tpg_1 */
3852 res
= core_tpg_register(&srpt_target
->tf_ops
, &sport
->port_wwn
,
3853 &sport
->port_tpg_1
, sport
, TRANSPORT_TPG_TYPE_NORMAL
);
3855 return ERR_PTR(res
);
3857 return &sport
->port_tpg_1
;
3861 * configfs callback invoked for
3862 * rmdir /sys/kernel/config/target/$driver/$port/$tpg
3864 static void srpt_drop_tpg(struct se_portal_group
*tpg
)
3866 struct srpt_port
*sport
= container_of(tpg
,
3867 struct srpt_port
, port_tpg_1
);
3869 sport
->enabled
= false;
3870 core_tpg_deregister(&sport
->port_tpg_1
);
3874 * configfs callback invoked for
3875 * mkdir /sys/kernel/config/target/$driver/$port
3877 static struct se_wwn
*srpt_make_tport(struct target_fabric_configfs
*tf
,
3878 struct config_group
*group
,
3881 struct srpt_port
*sport
;
3884 sport
= srpt_lookup_port(name
);
3885 pr_debug("make_tport(%s)\n", name
);
3890 return &sport
->port_wwn
;
3893 return ERR_PTR(ret
);
3897 * configfs callback invoked for
3898 * rmdir /sys/kernel/config/target/$driver/$port
3900 static void srpt_drop_tport(struct se_wwn
*wwn
)
3902 struct srpt_port
*sport
= container_of(wwn
, struct srpt_port
, port_wwn
);
3904 pr_debug("drop_tport(%s\n", config_item_name(&sport
->port_wwn
.wwn_group
.cg_item
));
3907 static ssize_t
srpt_wwn_show_attr_version(struct target_fabric_configfs
*tf
,
3910 return scnprintf(buf
, PAGE_SIZE
, "%s\n", DRV_VERSION
);
3913 TF_WWN_ATTR_RO(srpt
, version
);
3915 static struct configfs_attribute
*srpt_wwn_attrs
[] = {
3916 &srpt_wwn_version
.attr
,
3920 static struct target_core_fabric_ops srpt_template
= {
3921 .get_fabric_name
= srpt_get_fabric_name
,
3922 .get_fabric_proto_ident
= srpt_get_fabric_proto_ident
,
3923 .tpg_get_wwn
= srpt_get_fabric_wwn
,
3924 .tpg_get_tag
= srpt_get_tag
,
3925 .tpg_get_default_depth
= srpt_get_default_depth
,
3926 .tpg_get_pr_transport_id
= srpt_get_pr_transport_id
,
3927 .tpg_get_pr_transport_id_len
= srpt_get_pr_transport_id_len
,
3928 .tpg_parse_pr_out_transport_id
= srpt_parse_pr_out_transport_id
,
3929 .tpg_check_demo_mode
= srpt_check_false
,
3930 .tpg_check_demo_mode_cache
= srpt_check_true
,
3931 .tpg_check_demo_mode_write_protect
= srpt_check_true
,
3932 .tpg_check_prod_mode_write_protect
= srpt_check_false
,
3933 .tpg_alloc_fabric_acl
= srpt_alloc_fabric_acl
,
3934 .tpg_release_fabric_acl
= srpt_release_fabric_acl
,
3935 .tpg_get_inst_index
= srpt_tpg_get_inst_index
,
3936 .release_cmd
= srpt_release_cmd
,
3937 .check_stop_free
= srpt_check_stop_free
,
3938 .shutdown_session
= srpt_shutdown_session
,
3939 .close_session
= srpt_close_session
,
3940 .sess_get_index
= srpt_sess_get_index
,
3941 .sess_get_initiator_sid
= NULL
,
3942 .write_pending
= srpt_write_pending
,
3943 .write_pending_status
= srpt_write_pending_status
,
3944 .set_default_node_attributes
= srpt_set_default_node_attrs
,
3945 .get_task_tag
= srpt_get_task_tag
,
3946 .get_cmd_state
= srpt_get_tcm_cmd_state
,
3947 .queue_data_in
= srpt_queue_response
,
3948 .queue_status
= srpt_queue_status
,
3949 .queue_tm_rsp
= srpt_queue_response
,
3950 .get_fabric_sense_len
= srpt_get_fabric_sense_len
,
3951 .set_fabric_sense_len
= srpt_set_fabric_sense_len
,
3953 * Setup function pointers for generic logic in
3954 * target_core_fabric_configfs.c
3956 .fabric_make_wwn
= srpt_make_tport
,
3957 .fabric_drop_wwn
= srpt_drop_tport
,
3958 .fabric_make_tpg
= srpt_make_tpg
,
3959 .fabric_drop_tpg
= srpt_drop_tpg
,
3960 .fabric_post_link
= NULL
,
3961 .fabric_pre_unlink
= NULL
,
3962 .fabric_make_np
= NULL
,
3963 .fabric_drop_np
= NULL
,
3964 .fabric_make_nodeacl
= srpt_make_nodeacl
,
3965 .fabric_drop_nodeacl
= srpt_drop_nodeacl
,
3969 * srpt_init_module() - Kernel module initialization.
3971 * Note: Since ib_register_client() registers callback functions, and since at
3972 * least one of these callback functions (srpt_add_one()) calls target core
3973 * functions, this driver must be registered with the target core before
3974 * ib_register_client() is called.
3976 static int __init
srpt_init_module(void)
3981 if (srp_max_req_size
< MIN_MAX_REQ_SIZE
) {
3982 printk(KERN_ERR
"invalid value %d for kernel module parameter"
3983 " srp_max_req_size -- must be at least %d.\n",
3984 srp_max_req_size
, MIN_MAX_REQ_SIZE
);
3988 if (srpt_srq_size
< MIN_SRPT_SRQ_SIZE
3989 || srpt_srq_size
> MAX_SRPT_SRQ_SIZE
) {
3990 printk(KERN_ERR
"invalid value %d for kernel module parameter"
3991 " srpt_srq_size -- must be in the range [%d..%d].\n",
3992 srpt_srq_size
, MIN_SRPT_SRQ_SIZE
, MAX_SRPT_SRQ_SIZE
);
3996 srpt_target
= target_fabric_configfs_init(THIS_MODULE
, "srpt");
3997 if (IS_ERR(srpt_target
)) {
3998 printk(KERN_ERR
"couldn't register\n");
3999 ret
= PTR_ERR(srpt_target
);
4003 srpt_target
->tf_ops
= srpt_template
;
4006 * Set up default attribute lists.
4008 srpt_target
->tf_cit_tmpl
.tfc_wwn_cit
.ct_attrs
= srpt_wwn_attrs
;
4009 srpt_target
->tf_cit_tmpl
.tfc_tpg_base_cit
.ct_attrs
= srpt_tpg_attrs
;
4010 srpt_target
->tf_cit_tmpl
.tfc_tpg_attrib_cit
.ct_attrs
= srpt_tpg_attrib_attrs
;
4011 srpt_target
->tf_cit_tmpl
.tfc_tpg_param_cit
.ct_attrs
= NULL
;
4012 srpt_target
->tf_cit_tmpl
.tfc_tpg_np_base_cit
.ct_attrs
= NULL
;
4013 srpt_target
->tf_cit_tmpl
.tfc_tpg_nacl_base_cit
.ct_attrs
= NULL
;
4014 srpt_target
->tf_cit_tmpl
.tfc_tpg_nacl_attrib_cit
.ct_attrs
= NULL
;
4015 srpt_target
->tf_cit_tmpl
.tfc_tpg_nacl_auth_cit
.ct_attrs
= NULL
;
4016 srpt_target
->tf_cit_tmpl
.tfc_tpg_nacl_param_cit
.ct_attrs
= NULL
;
4018 ret
= target_fabric_configfs_register(srpt_target
);
4020 printk(KERN_ERR
"couldn't register\n");
4021 goto out_free_target
;
4024 ret
= ib_register_client(&srpt_client
);
4026 printk(KERN_ERR
"couldn't register IB client\n");
4027 goto out_unregister_target
;
4032 out_unregister_target
:
4033 target_fabric_configfs_deregister(srpt_target
);
4037 target_fabric_configfs_free(srpt_target
);
4042 static void __exit
srpt_cleanup_module(void)
4044 ib_unregister_client(&srpt_client
);
4045 target_fabric_configfs_deregister(srpt_target
);
4049 module_init(srpt_init_module
);
4050 module_exit(srpt_cleanup_module
);