blob: 18cf65f092e89f050592c28c699710ee15ebb459 [file] [log] [blame]
Or Gerlitz1cfa0a72006-05-11 10:02:46 +03001/*
2 * Copyright (c) 2004, 2005, 2006 Voltaire, Inc. All rights reserved.
3 * Copyright (c) 2005, 2006 Cisco Systems. All rights reserved.
4 *
5 * This software is available to you under a choice of one of two
6 * licenses. You may choose to be licensed under the terms of the GNU
7 * General Public License (GPL) Version 2, available from the file
8 * COPYING in the main directory of this source tree, or the
9 * OpenIB.org BSD license below:
10 *
11 * Redistribution and use in source and binary forms, with or
12 * without modification, are permitted provided that the following
13 * conditions are met:
14 *
15 * - Redistributions of source code must retain the above
16 * copyright notice, this list of conditions and the following
17 * disclaimer.
18 *
19 * - Redistributions in binary form must reproduce the above
20 * copyright notice, this list of conditions and the following
21 * disclaimer in the documentation and/or other materials
22 * provided with the distribution.
23 *
24 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
25 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
26 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
27 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
28 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
29 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
30 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
31 * SOFTWARE.
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030032 */
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030033#include <linux/kernel.h>
34#include <linux/module.h>
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030035#include <linux/delay.h>
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030036
37#include "iscsi_iser.h"
38
/* number of connections the per-device completion queues are sized for */
#define ISCSI_ISER_MAX_CONN	8
/* CQ depths: per-QP work request limit times the connection bound above */
#define ISER_MAX_RX_CQ_LEN	(ISER_QP_MAX_RECV_DTOS * ISCSI_ISER_MAX_CONN)
#define ISER_MAX_TX_CQ_LEN	(ISER_QP_MAX_REQ_DTOS * ISCSI_ISER_MAX_CONN)

/* defined at the end of this file, referenced when the CQs are created */
static void iser_cq_tasklet_fn(unsigned long data);
static void iser_cq_callback(struct ib_cq *cq, void *cq_context);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030045
46static void iser_cq_event_callback(struct ib_event *cause, void *context)
47{
48 iser_err("got cq event %d \n", cause->event);
49}
50
51static void iser_qp_event_callback(struct ib_event *cause, void *context)
52{
53 iser_err("got qp event %d\n",cause->event);
54}
55
56/**
57 * iser_create_device_ib_res - creates Protection Domain (PD), Completion
58 * Queue (CQ), DMA Memory Region (DMA MR) with the device associated with
59 * the adapator.
60 *
61 * returns 0 on success, -1 on failure
62 */
63static int iser_create_device_ib_res(struct iser_device *device)
64{
65 device->pd = ib_alloc_pd(device->ib_device);
66 if (IS_ERR(device->pd))
67 goto pd_err;
68
Or Gerlitz78ad0a32010-02-08 13:19:21 +000069 device->rx_cq = ib_create_cq(device->ib_device,
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030070 iser_cq_callback,
71 iser_cq_event_callback,
72 (void *)device,
Or Gerlitz78ad0a32010-02-08 13:19:21 +000073 ISER_MAX_RX_CQ_LEN, 0);
74 if (IS_ERR(device->rx_cq))
75 goto rx_cq_err;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030076
Or Gerlitz78ad0a32010-02-08 13:19:21 +000077 device->tx_cq = ib_create_cq(device->ib_device,
78 NULL, iser_cq_event_callback,
79 (void *)device,
80 ISER_MAX_TX_CQ_LEN, 0);
81
82 if (IS_ERR(device->tx_cq))
83 goto tx_cq_err;
84
85 if (ib_req_notify_cq(device->rx_cq, IB_CQ_NEXT_COMP))
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030086 goto cq_arm_err;
87
88 tasklet_init(&device->cq_tasklet,
89 iser_cq_tasklet_fn,
90 (unsigned long)device);
91
Erez Zilberd8111022006-09-11 12:26:33 +030092 device->mr = ib_get_dma_mr(device->pd, IB_ACCESS_LOCAL_WRITE |
93 IB_ACCESS_REMOTE_WRITE |
94 IB_ACCESS_REMOTE_READ);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +030095 if (IS_ERR(device->mr))
96 goto dma_mr_err;
97
98 return 0;
99
100dma_mr_err:
101 tasklet_kill(&device->cq_tasklet);
102cq_arm_err:
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000103 ib_destroy_cq(device->tx_cq);
104tx_cq_err:
105 ib_destroy_cq(device->rx_cq);
106rx_cq_err:
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300107 ib_dealloc_pd(device->pd);
108pd_err:
109 iser_err("failed to allocate an IB resource\n");
110 return -1;
111}
112
113/**
Oliver Pinter38dc7322008-01-25 14:15:32 -0800114 * iser_free_device_ib_res - destroy/dealloc/dereg the DMA MR,
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300115 * CQ and PD created with the device associated with the adapator.
116 */
117static void iser_free_device_ib_res(struct iser_device *device)
118{
119 BUG_ON(device->mr == NULL);
120
121 tasklet_kill(&device->cq_tasklet);
122
123 (void)ib_dereg_mr(device->mr);
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000124 (void)ib_destroy_cq(device->tx_cq);
125 (void)ib_destroy_cq(device->rx_cq);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300126 (void)ib_dealloc_pd(device->pd);
127
128 device->mr = NULL;
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000129 device->tx_cq = NULL;
130 device->rx_cq = NULL;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300131 device->pd = NULL;
132}
133
134/**
135 * iser_create_ib_conn_res - Creates FMR pool and Queue-Pair (QP)
136 *
137 * returns 0 on success, -1 on failure
138 */
139static int iser_create_ib_conn_res(struct iser_conn *ib_conn)
140{
141 struct iser_device *device;
142 struct ib_qp_init_attr init_attr;
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000143 int ret = -ENOMEM;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300144 struct ib_fmr_pool_param params;
145
146 BUG_ON(ib_conn->device == NULL);
147
148 device = ib_conn->device;
149
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000150 ib_conn->login_buf = kmalloc(ISER_RX_LOGIN_SIZE, GFP_KERNEL);
151 if (!ib_conn->login_buf) {
152 goto alloc_err;
153 ret = -ENOMEM;
154 }
155
156 ib_conn->login_dma = ib_dma_map_single(ib_conn->device->ib_device,
157 (void *)ib_conn->login_buf, ISER_RX_LOGIN_SIZE,
158 DMA_FROM_DEVICE);
159
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300160 ib_conn->page_vec = kmalloc(sizeof(struct iser_page_vec) +
161 (sizeof(u64) * (ISCSI_ISER_SG_TABLESIZE +1)),
162 GFP_KERNEL);
163 if (!ib_conn->page_vec) {
164 ret = -ENOMEM;
165 goto alloc_err;
166 }
167 ib_conn->page_vec->pages = (u64 *) (ib_conn->page_vec + 1);
168
Erez Zilber8dfa0872006-09-11 12:22:30 +0300169 params.page_shift = SHIFT_4K;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300170 /* when the first/last SG element are not start/end *
171 * page aligned, the map whould be of N+1 pages */
172 params.max_pages_per_fmr = ISCSI_ISER_SG_TABLESIZE + 1;
173 /* make the pool size twice the max number of SCSI commands *
174 * the ML is expected to queue, watermark for unmap at 50% */
Mike Christie15482712007-05-30 12:57:19 -0500175 params.pool_size = ISCSI_DEF_XMIT_CMDS_MAX * 2;
176 params.dirty_watermark = ISCSI_DEF_XMIT_CMDS_MAX;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300177 params.cache = 0;
178 params.flush_function = NULL;
179 params.access = (IB_ACCESS_LOCAL_WRITE |
180 IB_ACCESS_REMOTE_WRITE |
181 IB_ACCESS_REMOTE_READ);
182
183 ib_conn->fmr_pool = ib_create_fmr_pool(device->pd, &params);
184 if (IS_ERR(ib_conn->fmr_pool)) {
185 ret = PTR_ERR(ib_conn->fmr_pool);
186 goto fmr_pool_err;
187 }
188
189 memset(&init_attr, 0, sizeof init_attr);
190
191 init_attr.event_handler = iser_qp_event_callback;
192 init_attr.qp_context = (void *)ib_conn;
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000193 init_attr.send_cq = device->tx_cq;
194 init_attr.recv_cq = device->rx_cq;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300195 init_attr.cap.max_send_wr = ISER_QP_MAX_REQ_DTOS;
196 init_attr.cap.max_recv_wr = ISER_QP_MAX_RECV_DTOS;
Or Gerlitzf19624a2010-02-08 13:19:56 +0000197 init_attr.cap.max_send_sge = 2;
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000198 init_attr.cap.max_recv_sge = 1;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300199 init_attr.sq_sig_type = IB_SIGNAL_REQ_WR;
200 init_attr.qp_type = IB_QPT_RC;
201
202 ret = rdma_create_qp(ib_conn->cma_id, device->pd, &init_attr);
203 if (ret)
204 goto qp_err;
205
206 ib_conn->qp = ib_conn->cma_id->qp;
207 iser_err("setting conn %p cma_id %p: fmr_pool %p qp %p\n",
208 ib_conn, ib_conn->cma_id,
209 ib_conn->fmr_pool, ib_conn->cma_id->qp);
210 return ret;
211
212qp_err:
213 (void)ib_destroy_fmr_pool(ib_conn->fmr_pool);
214fmr_pool_err:
215 kfree(ib_conn->page_vec);
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000216 kfree(ib_conn->login_buf);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300217alloc_err:
218 iser_err("unable to alloc mem or create resource, err %d\n", ret);
219 return ret;
220}
221
222/**
223 * releases the FMR pool, QP and CMA ID objects, returns 0 on success,
224 * -1 on failure
225 */
226static int iser_free_ib_conn_res(struct iser_conn *ib_conn)
227{
228 BUG_ON(ib_conn == NULL);
229
230 iser_err("freeing conn %p cma_id %p fmr pool %p qp %p\n",
231 ib_conn, ib_conn->cma_id,
232 ib_conn->fmr_pool, ib_conn->qp);
233
234 /* qp is created only once both addr & route are resolved */
235 if (ib_conn->fmr_pool != NULL)
236 ib_destroy_fmr_pool(ib_conn->fmr_pool);
237
238 if (ib_conn->qp != NULL)
239 rdma_destroy_qp(ib_conn->cma_id);
240
241 if (ib_conn->cma_id != NULL)
242 rdma_destroy_id(ib_conn->cma_id);
243
244 ib_conn->fmr_pool = NULL;
245 ib_conn->qp = NULL;
246 ib_conn->cma_id = NULL;
247 kfree(ib_conn->page_vec);
248
249 return 0;
250}
251
252/**
253 * based on the resolved device node GUID see if there already allocated
254 * device for this device. If there's no such, create one.
255 */
256static
257struct iser_device *iser_device_find_by_ib_device(struct rdma_cm_id *cma_id)
258{
Arne Redlich9a378272008-03-04 14:07:22 +0200259 struct iser_device *device;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300260
261 mutex_lock(&ig.device_list_mutex);
262
Arne Redlich9a378272008-03-04 14:07:22 +0200263 list_for_each_entry(device, &ig.device_list, ig_list)
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300264 /* find if there's a match using the node GUID */
265 if (device->ib_device->node_guid == cma_id->device->node_guid)
Arne Redlichd33ed422008-03-04 14:11:54 +0200266 goto inc_refcnt;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300267
Arne Redlich9a378272008-03-04 14:07:22 +0200268 device = kzalloc(sizeof *device, GFP_KERNEL);
269 if (device == NULL)
270 goto out;
271
272 /* assign this device to the device */
273 device->ib_device = cma_id->device;
274 /* init the device and link it into ig device list */
275 if (iser_create_device_ib_res(device)) {
276 kfree(device);
277 device = NULL;
278 goto out;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300279 }
Arne Redlich9a378272008-03-04 14:07:22 +0200280 list_add(&device->ig_list, &ig.device_list);
281
Arne Redlichd33ed422008-03-04 14:11:54 +0200282inc_refcnt:
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300283 device->refcount++;
Arne Redlichd33ed422008-03-04 14:11:54 +0200284out:
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300285 mutex_unlock(&ig.device_list_mutex);
286 return device;
287}
288
289/* if there's no demand for this device, release it */
290static void iser_device_try_release(struct iser_device *device)
291{
292 mutex_lock(&ig.device_list_mutex);
293 device->refcount--;
294 iser_err("device %p refcount %d\n",device,device->refcount);
295 if (!device->refcount) {
296 iser_free_device_ib_res(device);
297 list_del(&device->ig_list);
298 kfree(device);
299 }
300 mutex_unlock(&ig.device_list_mutex);
301}
302
303int iser_conn_state_comp(struct iser_conn *ib_conn,
304 enum iser_ib_conn_state comp)
305{
306 int ret;
307
308 spin_lock_bh(&ib_conn->lock);
309 ret = (ib_conn->state == comp);
310 spin_unlock_bh(&ib_conn->lock);
311 return ret;
312}
313
314static int iser_conn_state_comp_exch(struct iser_conn *ib_conn,
315 enum iser_ib_conn_state comp,
316 enum iser_ib_conn_state exch)
317{
318 int ret;
319
320 spin_lock_bh(&ib_conn->lock);
321 if ((ret = (ib_conn->state == comp)))
322 ib_conn->state = exch;
323 spin_unlock_bh(&ib_conn->lock);
324 return ret;
325}
326
327/**
Roland Dreier41179e22007-07-17 18:37:42 -0700328 * Frees all conn objects and deallocs conn descriptor
329 */
330static void iser_conn_release(struct iser_conn *ib_conn)
331{
332 struct iser_device *device = ib_conn->device;
333
334 BUG_ON(ib_conn->state != ISER_CONN_DOWN);
335
336 mutex_lock(&ig.connlist_mutex);
337 list_del(&ib_conn->conn_list);
338 mutex_unlock(&ig.connlist_mutex);
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000339 iser_free_rx_descriptors(ib_conn);
Roland Dreier41179e22007-07-17 18:37:42 -0700340 iser_free_ib_conn_res(ib_conn);
341 ib_conn->device = NULL;
342 /* on EVENT_ADDR_ERROR there's no device yet for this conn */
343 if (device != NULL)
344 iser_device_try_release(device);
345 if (ib_conn->iser_conn)
346 ib_conn->iser_conn->ib_conn = NULL;
Mike Christie412eeaf2008-05-21 15:54:14 -0500347 iscsi_destroy_endpoint(ib_conn->ep);
Roland Dreier41179e22007-07-17 18:37:42 -0700348}
349
Mike Christieb40977d2008-05-21 15:54:03 -0500350void iser_conn_get(struct iser_conn *ib_conn)
351{
352 atomic_inc(&ib_conn->refcount);
353}
354
355void iser_conn_put(struct iser_conn *ib_conn)
356{
357 if (atomic_dec_and_test(&ib_conn->refcount))
358 iser_conn_release(ib_conn);
Roland Dreier41179e22007-07-17 18:37:42 -0700359}
360
361/**
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300362 * triggers start of the disconnect procedures and wait for them to be done
363 */
364void iser_conn_terminate(struct iser_conn *ib_conn)
365{
366 int err = 0;
367
368 /* change the ib conn state only if the conn is UP, however always call
369 * rdma_disconnect since this is the only way to cause the CMA to change
370 * the QP state to ERROR
371 */
372
373 iser_conn_state_comp_exch(ib_conn, ISER_CONN_UP, ISER_CONN_TERMINATING);
374 err = rdma_disconnect(ib_conn->cma_id);
375 if (err)
376 iser_err("Failed to disconnect, conn: 0x%p err %d\n",
377 ib_conn,err);
378
379 wait_event_interruptible(ib_conn->wait,
380 ib_conn->state == ISER_CONN_DOWN);
381
Mike Christieb40977d2008-05-21 15:54:03 -0500382 iser_conn_put(ib_conn);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300383}
384
385static void iser_connect_error(struct rdma_cm_id *cma_id)
386{
387 struct iser_conn *ib_conn;
388 ib_conn = (struct iser_conn *)cma_id->context;
389
390 ib_conn->state = ISER_CONN_DOWN;
391 wake_up_interruptible(&ib_conn->wait);
392}
393
394static void iser_addr_handler(struct rdma_cm_id *cma_id)
395{
396 struct iser_device *device;
397 struct iser_conn *ib_conn;
398 int ret;
399
400 device = iser_device_find_by_ib_device(cma_id);
Arne Redlichd33ed422008-03-04 14:11:54 +0200401 if (!device) {
402 iser_err("device lookup/creation failed\n");
403 iser_connect_error(cma_id);
404 return;
405 }
406
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300407 ib_conn = (struct iser_conn *)cma_id->context;
408 ib_conn->device = device;
409
410 ret = rdma_resolve_route(cma_id, 1000);
411 if (ret) {
412 iser_err("resolve route failed: %d\n", ret);
413 iser_connect_error(cma_id);
414 }
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300415}
416
417static void iser_route_handler(struct rdma_cm_id *cma_id)
418{
419 struct rdma_conn_param conn_param;
420 int ret;
421
422 ret = iser_create_ib_conn_res((struct iser_conn *)cma_id->context);
423 if (ret)
424 goto failure;
425
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300426 memset(&conn_param, 0, sizeof conn_param);
427 conn_param.responder_resources = 4;
428 conn_param.initiator_depth = 1;
429 conn_param.retry_count = 7;
430 conn_param.rnr_retry_count = 6;
431
432 ret = rdma_connect(cma_id, &conn_param);
433 if (ret) {
434 iser_err("failure connecting: %d\n", ret);
435 goto failure;
436 }
437
438 return;
439failure:
440 iser_connect_error(cma_id);
441}
442
443static void iser_connected_handler(struct rdma_cm_id *cma_id)
444{
445 struct iser_conn *ib_conn;
446
447 ib_conn = (struct iser_conn *)cma_id->context;
448 ib_conn->state = ISER_CONN_UP;
449 wake_up_interruptible(&ib_conn->wait);
450}
451
452static void iser_disconnected_handler(struct rdma_cm_id *cma_id)
453{
454 struct iser_conn *ib_conn;
455
456 ib_conn = (struct iser_conn *)cma_id->context;
457 ib_conn->disc_evt_flag = 1;
458
459 /* getting here when the state is UP means that the conn is being *
460 * terminated asynchronously from the iSCSI layer's perspective. */
461 if (iser_conn_state_comp_exch(ib_conn, ISER_CONN_UP,
462 ISER_CONN_TERMINATING))
463 iscsi_conn_failure(ib_conn->iser_conn->iscsi_conn,
464 ISCSI_ERR_CONN_FAILED);
465
466 /* Complete the termination process if no posts are pending */
Or Gerlitz704315f2010-02-08 13:18:39 +0000467 if (ib_conn->post_recv_buf_count == 0 &&
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300468 (atomic_read(&ib_conn->post_send_buf_count) == 0)) {
469 ib_conn->state = ISER_CONN_DOWN;
470 wake_up_interruptible(&ib_conn->wait);
471 }
472}
473
474static int iser_cma_handler(struct rdma_cm_id *cma_id, struct rdma_cm_event *event)
475{
476 int ret = 0;
477
478 iser_err("event %d conn %p id %p\n",event->event,cma_id->context,cma_id);
479
480 switch (event->event) {
481 case RDMA_CM_EVENT_ADDR_RESOLVED:
482 iser_addr_handler(cma_id);
483 break;
484 case RDMA_CM_EVENT_ROUTE_RESOLVED:
485 iser_route_handler(cma_id);
486 break;
487 case RDMA_CM_EVENT_ESTABLISHED:
488 iser_connected_handler(cma_id);
489 break;
490 case RDMA_CM_EVENT_ADDR_ERROR:
491 case RDMA_CM_EVENT_ROUTE_ERROR:
492 case RDMA_CM_EVENT_CONNECT_ERROR:
493 case RDMA_CM_EVENT_UNREACHABLE:
494 case RDMA_CM_EVENT_REJECTED:
495 iser_err("event: %d, error: %d\n", event->event, event->status);
496 iser_connect_error(cma_id);
497 break;
498 case RDMA_CM_EVENT_DISCONNECTED:
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300499 case RDMA_CM_EVENT_DEVICE_REMOVAL:
Or Gerlitz2f5de152008-07-22 14:16:21 -0700500 case RDMA_CM_EVENT_ADDR_CHANGE:
Erez Zilberd97c5172008-04-16 21:09:35 -0700501 iser_disconnected_handler(cma_id);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300502 break;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300503 default:
Erez Zilbera4ef1452008-01-17 11:51:58 +0200504 iser_err("Unexpected RDMA CM event (%d)\n", event->event);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300505 break;
506 }
507 return ret;
508}
509
Mike Christie412eeaf2008-05-21 15:54:14 -0500510void iser_conn_init(struct iser_conn *ib_conn)
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300511{
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300512 ib_conn->state = ISER_CONN_INIT;
513 init_waitqueue_head(&ib_conn->wait);
Or Gerlitz704315f2010-02-08 13:18:39 +0000514 ib_conn->post_recv_buf_count = 0;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300515 atomic_set(&ib_conn->post_send_buf_count, 0);
Mike Christieb40977d2008-05-21 15:54:03 -0500516 atomic_set(&ib_conn->refcount, 1);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300517 INIT_LIST_HEAD(&ib_conn->conn_list);
518 spin_lock_init(&ib_conn->lock);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300519}
520
521 /**
522 * starts the process of connecting to the target
Thadeu Lima de Souza Cascardo94e2bd62009-10-16 15:20:49 +0200523 * sleeps until the connection is established or rejected
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300524 */
525int iser_connect(struct iser_conn *ib_conn,
526 struct sockaddr_in *src_addr,
527 struct sockaddr_in *dst_addr,
528 int non_blocking)
529{
530 struct sockaddr *src, *dst;
531 int err = 0;
532
Harvey Harrison63779432008-10-31 00:56:00 -0700533 sprintf(ib_conn->name, "%pI4:%d",
534 &dst_addr->sin_addr.s_addr, dst_addr->sin_port);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300535
536 /* the device is known only --after-- address resolution */
537 ib_conn->device = NULL;
538
Harvey Harrison63779432008-10-31 00:56:00 -0700539 iser_err("connecting to: %pI4, port 0x%x\n",
540 &dst_addr->sin_addr, dst_addr->sin_port);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300541
542 ib_conn->state = ISER_CONN_PENDING;
543
544 ib_conn->cma_id = rdma_create_id(iser_cma_handler,
545 (void *)ib_conn,
546 RDMA_PS_TCP);
547 if (IS_ERR(ib_conn->cma_id)) {
548 err = PTR_ERR(ib_conn->cma_id);
549 iser_err("rdma_create_id failed: %d\n", err);
550 goto id_failure;
551 }
552
553 src = (struct sockaddr *)src_addr;
554 dst = (struct sockaddr *)dst_addr;
555 err = rdma_resolve_addr(ib_conn->cma_id, src, dst, 1000);
556 if (err) {
557 iser_err("rdma_resolve_addr failed: %d\n", err);
558 goto addr_failure;
559 }
560
561 if (!non_blocking) {
562 wait_event_interruptible(ib_conn->wait,
563 (ib_conn->state != ISER_CONN_PENDING));
564
565 if (ib_conn->state != ISER_CONN_UP) {
566 err = -EIO;
567 goto connect_failure;
568 }
569 }
570
571 mutex_lock(&ig.connlist_mutex);
572 list_add(&ib_conn->conn_list, &ig.connlist);
573 mutex_unlock(&ig.connlist_mutex);
574 return 0;
575
576id_failure:
577 ib_conn->cma_id = NULL;
578addr_failure:
579 ib_conn->state = ISER_CONN_DOWN;
580connect_failure:
581 iser_conn_release(ib_conn);
582 return err;
583}
584
585/**
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300586 * iser_reg_page_vec - Register physical memory
587 *
588 * returns: 0 on success, errno code on failure
589 */
590int iser_reg_page_vec(struct iser_conn *ib_conn,
591 struct iser_page_vec *page_vec,
592 struct iser_mem_reg *mem_reg)
593{
594 struct ib_pool_fmr *mem;
595 u64 io_addr;
596 u64 *page_list;
597 int status;
598
599 page_list = page_vec->pages;
600 io_addr = page_list[0];
601
602 mem = ib_fmr_pool_map_phys(ib_conn->fmr_pool,
603 page_list,
604 page_vec->length,
Michael S. Tsirkinadfaa882006-07-14 00:23:55 -0700605 io_addr);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300606
607 if (IS_ERR(mem)) {
608 status = (int)PTR_ERR(mem);
609 iser_err("ib_fmr_pool_map_phys failed: %d\n", status);
610 return status;
611 }
612
613 mem_reg->lkey = mem->fmr->lkey;
614 mem_reg->rkey = mem->fmr->rkey;
Erez Zilber8dfa0872006-09-11 12:22:30 +0300615 mem_reg->len = page_vec->length * SIZE_4K;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300616 mem_reg->va = io_addr;
Erez Zilberd8111022006-09-11 12:26:33 +0300617 mem_reg->is_fmr = 1;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300618 mem_reg->mem_h = (void *)mem;
619
620 mem_reg->va += page_vec->offset;
621 mem_reg->len = page_vec->data_size;
622
623 iser_dbg("PHYSICAL Mem.register, [PHYS p_array: 0x%p, sz: %d, "
624 "entry[0]: (0x%08lx,%ld)] -> "
625 "[lkey: 0x%08X mem_h: 0x%p va: 0x%08lX sz: %ld]\n",
626 page_vec, page_vec->length,
627 (unsigned long)page_vec->pages[0],
628 (unsigned long)page_vec->data_size,
629 (unsigned int)mem_reg->lkey, mem_reg->mem_h,
630 (unsigned long)mem_reg->va, (unsigned long)mem_reg->len);
631 return 0;
632}
633
634/**
635 * Unregister (previosuly registered) memory.
636 */
637void iser_unreg_mem(struct iser_mem_reg *reg)
638{
639 int ret;
640
641 iser_dbg("PHYSICAL Mem.Unregister mem_h %p\n",reg->mem_h);
642
643 ret = ib_fmr_pool_unmap((struct ib_pool_fmr *)reg->mem_h);
644 if (ret)
645 iser_err("ib_fmr_pool_unmap failed %d\n", ret);
646
647 reg->mem_h = NULL;
648}
649
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000650int iser_post_recvl(struct iser_conn *ib_conn)
651{
652 struct ib_recv_wr rx_wr, *rx_wr_failed;
653 struct ib_sge sge;
654 int ib_ret;
655
656 sge.addr = ib_conn->login_dma;
657 sge.length = ISER_RX_LOGIN_SIZE;
658 sge.lkey = ib_conn->device->mr->lkey;
659
660 rx_wr.wr_id = (unsigned long)ib_conn->login_buf;
661 rx_wr.sg_list = &sge;
662 rx_wr.num_sge = 1;
663 rx_wr.next = NULL;
664
Or Gerlitz704315f2010-02-08 13:18:39 +0000665 ib_conn->post_recv_buf_count++;
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000666 ib_ret = ib_post_recv(ib_conn->qp, &rx_wr, &rx_wr_failed);
667 if (ib_ret) {
668 iser_err("ib_post_recv failed ret=%d\n", ib_ret);
Or Gerlitz704315f2010-02-08 13:18:39 +0000669 ib_conn->post_recv_buf_count--;
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000670 }
671 return ib_ret;
672}
673
674int iser_post_recvm(struct iser_conn *ib_conn, int count)
675{
676 struct ib_recv_wr *rx_wr, *rx_wr_failed;
677 int i, ib_ret;
678 unsigned int my_rx_head = ib_conn->rx_desc_head;
679 struct iser_rx_desc *rx_desc;
680
681 for (rx_wr = ib_conn->rx_wr, i = 0; i < count; i++, rx_wr++) {
682 rx_desc = &ib_conn->rx_descs[my_rx_head];
683 rx_wr->wr_id = (unsigned long)rx_desc;
684 rx_wr->sg_list = &rx_desc->rx_sg;
685 rx_wr->num_sge = 1;
686 rx_wr->next = rx_wr + 1;
687 my_rx_head = (my_rx_head + 1) & (ISER_QP_MAX_RECV_DTOS - 1);
688 }
689
690 rx_wr--;
691 rx_wr->next = NULL; /* mark end of work requests list */
692
Or Gerlitz704315f2010-02-08 13:18:39 +0000693 ib_conn->post_recv_buf_count += count;
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000694 ib_ret = ib_post_recv(ib_conn->qp, ib_conn->rx_wr, &rx_wr_failed);
695 if (ib_ret) {
696 iser_err("ib_post_recv failed ret=%d\n", ib_ret);
Or Gerlitz704315f2010-02-08 13:18:39 +0000697 ib_conn->post_recv_buf_count -= count;
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000698 } else
699 ib_conn->rx_desc_head = my_rx_head;
700 return ib_ret;
701}
702
703
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300704/**
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300705 * iser_start_send - Initiate a Send DTO operation
706 *
707 * returns 0 on success, -1 on failure
708 */
Or Gerlitzf19624a2010-02-08 13:19:56 +0000709int iser_post_send(struct iser_conn *ib_conn, struct iser_tx_desc *tx_desc)
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300710{
Or Gerlitzf19624a2010-02-08 13:19:56 +0000711 int ib_ret;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300712 struct ib_send_wr send_wr, *send_wr_failed;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300713
Or Gerlitzf19624a2010-02-08 13:19:56 +0000714 ib_dma_sync_single_for_device(ib_conn->device->ib_device,
715 tx_desc->dma_addr, ISER_HEADERS_LEN, DMA_TO_DEVICE);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300716
717 send_wr.next = NULL;
718 send_wr.wr_id = (unsigned long)tx_desc;
Or Gerlitzf19624a2010-02-08 13:19:56 +0000719 send_wr.sg_list = tx_desc->tx_sg;
720 send_wr.num_sge = tx_desc->num_sge;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300721 send_wr.opcode = IB_WR_SEND;
Or Gerlitzf19624a2010-02-08 13:19:56 +0000722 send_wr.send_flags = IB_SEND_SIGNALED;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300723
724 atomic_inc(&ib_conn->post_send_buf_count);
725
726 ib_ret = ib_post_send(ib_conn->qp, &send_wr, &send_wr_failed);
727 if (ib_ret) {
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300728 iser_err("ib_post_send failed, ret:%d\n", ib_ret);
729 atomic_dec(&ib_conn->post_send_buf_count);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300730 }
Or Gerlitzf19624a2010-02-08 13:19:56 +0000731 return ib_ret;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300732}
733
Or Gerlitzf19624a2010-02-08 13:19:56 +0000734static void iser_handle_comp_error(struct iser_tx_desc *desc,
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000735 struct iser_conn *ib_conn)
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300736{
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000737 if (desc && desc->type == ISCSI_TX_DATAOUT)
738 kmem_cache_free(ig.desc_cache, desc);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300739
Or Gerlitz704315f2010-02-08 13:18:39 +0000740 if (ib_conn->post_recv_buf_count == 0 &&
Erez Zilber1d426d62007-04-01 12:53:43 +0200741 atomic_read(&ib_conn->post_send_buf_count) == 0) {
742 /* getting here when the state is UP means that the conn is *
743 * being terminated asynchronously from the iSCSI layer's *
744 * perspective. */
745 if (iser_conn_state_comp_exch(ib_conn, ISER_CONN_UP,
746 ISER_CONN_TERMINATING))
747 iscsi_conn_failure(ib_conn->iser_conn->iscsi_conn,
748 ISCSI_ERR_CONN_FAILED);
749
750 /* complete the termination process if disconnect event was delivered *
751 * note there are no more non completed posts to the QP */
752 if (ib_conn->disc_evt_flag) {
753 ib_conn->state = ISER_CONN_DOWN;
754 wake_up_interruptible(&ib_conn->wait);
755 }
756 }
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300757}
758
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000759static int iser_drain_tx_cq(struct iser_device *device)
760{
761 struct ib_cq *cq = device->tx_cq;
762 struct ib_wc wc;
Or Gerlitzf19624a2010-02-08 13:19:56 +0000763 struct iser_tx_desc *tx_desc;
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000764 struct iser_conn *ib_conn;
765 int completed_tx = 0;
766
767 while (ib_poll_cq(cq, 1, &wc) == 1) {
Or Gerlitzf19624a2010-02-08 13:19:56 +0000768 tx_desc = (struct iser_tx_desc *) (unsigned long) wc.wr_id;
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000769 ib_conn = wc.qp->qp_context;
770 if (wc.status == IB_WC_SUCCESS) {
771 if (wc.opcode == IB_WC_SEND)
Or Gerlitzf19624a2010-02-08 13:19:56 +0000772 iser_snd_completion(tx_desc, ib_conn);
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000773 else
774 iser_err("expected opcode %d got %d\n",
775 IB_WC_SEND, wc.opcode);
776 } else {
777 iser_err("tx id %llx status %d vend_err %x\n",
778 wc.wr_id, wc.status, wc.vendor_err);
779 atomic_dec(&ib_conn->post_send_buf_count);
780 iser_handle_comp_error(tx_desc, ib_conn);
781 }
782 completed_tx++;
783 }
784 return completed_tx;
785}
786
787
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300788static void iser_cq_tasklet_fn(unsigned long data)
789{
790 struct iser_device *device = (struct iser_device *)data;
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000791 struct ib_cq *cq = device->rx_cq;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300792 struct ib_wc wc;
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000793 struct iser_rx_desc *desc;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300794 unsigned long xfer_len;
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000795 struct iser_conn *ib_conn;
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000796 int completed_tx, completed_rx;
797 completed_tx = completed_rx = 0;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300798
799 while (ib_poll_cq(cq, 1, &wc) == 1) {
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000800 desc = (struct iser_rx_desc *) (unsigned long) wc.wr_id;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300801 BUG_ON(desc == NULL);
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000802 ib_conn = wc.qp->qp_context;
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300803 if (wc.status == IB_WC_SUCCESS) {
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000804 if (wc.opcode == IB_WC_RECV) {
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300805 xfer_len = (unsigned long)wc.byte_len;
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000806 iser_rcv_completion(desc, xfer_len, ib_conn);
807 } else
808 iser_err("expected opcode %d got %d\n",
809 IB_WC_RECV, wc.opcode);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300810 } else {
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000811 if (wc.status != IB_WC_WR_FLUSH_ERR)
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000812 iser_err("rx id %llx status %d vend_err %x\n",
Or Gerlitzbcc60c32010-02-08 13:17:42 +0000813 wc.wr_id, wc.status, wc.vendor_err);
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000814 ib_conn->post_recv_buf_count--;
815 iser_handle_comp_error(NULL, ib_conn);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300816 }
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000817 completed_rx++;
818 if (!(completed_rx & 63))
819 completed_tx += iser_drain_tx_cq(device);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300820 }
821 /* #warning "it is assumed here that arming CQ only once its empty" *
822 * " would not cause interrupts to be missed" */
823 ib_req_notify_cq(cq, IB_CQ_NEXT_COMP);
Or Gerlitz78ad0a32010-02-08 13:19:21 +0000824
825 completed_tx += iser_drain_tx_cq(device);
826 iser_dbg("got %d rx %d tx completions\n", completed_rx, completed_tx);
Or Gerlitz1cfa0a72006-05-11 10:02:46 +0300827}
828
829static void iser_cq_callback(struct ib_cq *cq, void *cq_context)
830{
831 struct iser_device *device = (struct iser_device *)cq_context;
832
833 tasklet_schedule(&device->cq_tasklet);
834}