b1195b1849020081dc3bbd86cf22b8bf086d1324
[platform/adaptation/renesas_rcar/renesas_kernel.git] / drivers / infiniband / ulp / isert / ib_isert.c
1 /*******************************************************************************
2  * This file contains iSCSI extensions for RDMA (iSER) Verbs
3  *
4  * (c) Copyright 2013 Datera, Inc.
5  *
6  * Nicholas A. Bellinger <nab@linux-iscsi.org>
7  *
8  * This program is free software; you can redistribute it and/or modify
9  * it under the terms of the GNU General Public License as published by
10  * the Free Software Foundation; either version 2 of the License, or
11  * (at your option) any later version.
12  *
13  * This program is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16  * GNU General Public License for more details.
17  ****************************************************************************/
18
19 #include <linux/string.h>
20 #include <linux/module.h>
21 #include <linux/scatterlist.h>
22 #include <linux/socket.h>
23 #include <linux/in.h>
24 #include <linux/in6.h>
25 #include <linux/llist.h>
26 #include <rdma/ib_verbs.h>
27 #include <rdma/rdma_cm.h>
28 #include <target/target_core_base.h>
29 #include <target/target_core_fabric.h>
30 #include <target/iscsi/iscsi_transport.h>
31 #include <linux/semaphore.h>
32
33 #include "isert_proto.h"
34 #include "ib_isert.h"
35
/*
 * Completion queue sizing: each CQ length is the per-QP work request
 * limit multiplied by ISERT_MAX_CONN.
 */
#define ISERT_MAX_CONN          8
#define ISER_MAX_RX_CQ_LEN      (ISERT_QP_MAX_RECV_DTOS * ISERT_MAX_CONN)
#define ISER_MAX_TX_CQ_LEN      (ISERT_QP_MAX_REQ_DTOS  * ISERT_MAX_CONN)

/*
 * device_list holds every struct isert_device (linked via dev_node);
 * device_list_mutex is held while walking or modifying the list and while
 * changing a device's refcount.
 */
static DEFINE_MUTEX(device_list_mutex);
static LIST_HEAD(device_list);
/* Workqueue handles; presumably for RX and completion work - TODO confirm. */
static struct workqueue_struct *isert_rx_wq;
static struct workqueue_struct *isert_comp_wq;
44
/*
 * Forward declarations of the RDMA memory (un)registration helpers that
 * isert_create_device_ib_res() installs as the device's reg_rdma_mem /
 * unreg_rdma_mem handlers.
 */
static void isert_unmap_cmd(struct isert_cmd *isert_cmd,
			    struct isert_conn *isert_conn);
static int isert_map_rdma(struct iscsi_conn *conn, struct iscsi_cmd *cmd,
			  struct isert_rdma_wr *wr);
static void isert_unreg_rdma(struct isert_cmd *isert_cmd,
			     struct isert_conn *isert_conn);
static int isert_reg_rdma(struct iscsi_conn *conn, struct iscsi_cmd *cmd,
			  struct isert_rdma_wr *wr);
55
56 static void
57 isert_qp_event_callback(struct ib_event *e, void *context)
58 {
59         struct isert_conn *isert_conn = (struct isert_conn *)context;
60
61         pr_err("isert_qp_event_callback event: %d\n", e->event);
62         switch (e->event) {
63         case IB_EVENT_COMM_EST:
64                 rdma_notify(isert_conn->conn_cm_id, IB_EVENT_COMM_EST);
65                 break;
66         case IB_EVENT_QP_LAST_WQE_REACHED:
67                 pr_warn("Reached TX IB_EVENT_QP_LAST_WQE_REACHED:\n");
68                 break;
69         default:
70                 break;
71         }
72 }
73
74 static int
75 isert_query_device(struct ib_device *ib_dev, struct ib_device_attr *devattr)
76 {
77         int ret;
78
79         ret = ib_query_device(ib_dev, devattr);
80         if (ret) {
81                 pr_err("ib_query_device() failed: %d\n", ret);
82                 return ret;
83         }
84         pr_debug("devattr->max_sge: %d\n", devattr->max_sge);
85         pr_debug("devattr->max_sge_rd: %d\n", devattr->max_sge_rd);
86
87         return 0;
88 }
89
90 static int
91 isert_conn_setup_qp(struct isert_conn *isert_conn, struct rdma_cm_id *cma_id)
92 {
93         struct isert_device *device = isert_conn->conn_device;
94         struct ib_qp_init_attr attr;
95         int ret, index, min_index = 0;
96
97         mutex_lock(&device_list_mutex);
98         for (index = 0; index < device->cqs_used; index++)
99                 if (device->cq_active_qps[index] <
100                     device->cq_active_qps[min_index])
101                         min_index = index;
102         device->cq_active_qps[min_index]++;
103         pr_debug("isert_conn_setup_qp: Using min_index: %d\n", min_index);
104         mutex_unlock(&device_list_mutex);
105
106         memset(&attr, 0, sizeof(struct ib_qp_init_attr));
107         attr.event_handler = isert_qp_event_callback;
108         attr.qp_context = isert_conn;
109         attr.send_cq = device->dev_tx_cq[min_index];
110         attr.recv_cq = device->dev_rx_cq[min_index];
111         attr.cap.max_send_wr = ISERT_QP_MAX_REQ_DTOS;
112         attr.cap.max_recv_wr = ISERT_QP_MAX_RECV_DTOS;
113         /*
114          * FIXME: Use devattr.max_sge - 2 for max_send_sge as
115          * work-around for RDMA_READs with ConnectX-2.
116          *
117          * Also, still make sure to have at least two SGEs for
118          * outgoing control PDU responses.
119          */
120         attr.cap.max_send_sge = max(2, device->dev_attr.max_sge - 2);
121         isert_conn->max_sge = attr.cap.max_send_sge;
122
123         attr.cap.max_recv_sge = 1;
124         attr.sq_sig_type = IB_SIGNAL_REQ_WR;
125         attr.qp_type = IB_QPT_RC;
126
127         pr_debug("isert_conn_setup_qp cma_id->device: %p\n",
128                  cma_id->device);
129         pr_debug("isert_conn_setup_qp conn_pd->device: %p\n",
130                  isert_conn->conn_pd->device);
131
132         ret = rdma_create_qp(cma_id, isert_conn->conn_pd, &attr);
133         if (ret) {
134                 pr_err("rdma_create_qp failed for cma_id %d\n", ret);
135                 return ret;
136         }
137         isert_conn->conn_qp = cma_id->qp;
138         pr_debug("rdma_create_qp() returned success >>>>>>>>>>>>>>>>>>>>>>>>>.\n");
139
140         return 0;
141 }
142
143 static void
144 isert_cq_event_callback(struct ib_event *e, void *context)
145 {
146         pr_debug("isert_cq_event_callback event: %d\n", e->event);
147 }
148
149 static int
150 isert_alloc_rx_descriptors(struct isert_conn *isert_conn)
151 {
152         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
153         struct iser_rx_desc *rx_desc;
154         struct ib_sge *rx_sg;
155         u64 dma_addr;
156         int i, j;
157
158         isert_conn->conn_rx_descs = kzalloc(ISERT_QP_MAX_RECV_DTOS *
159                                 sizeof(struct iser_rx_desc), GFP_KERNEL);
160         if (!isert_conn->conn_rx_descs)
161                 goto fail;
162
163         rx_desc = isert_conn->conn_rx_descs;
164
165         for (i = 0; i < ISERT_QP_MAX_RECV_DTOS; i++, rx_desc++)  {
166                 dma_addr = ib_dma_map_single(ib_dev, (void *)rx_desc,
167                                         ISER_RX_PAYLOAD_SIZE, DMA_FROM_DEVICE);
168                 if (ib_dma_mapping_error(ib_dev, dma_addr))
169                         goto dma_map_fail;
170
171                 rx_desc->dma_addr = dma_addr;
172
173                 rx_sg = &rx_desc->rx_sg;
174                 rx_sg->addr = rx_desc->dma_addr;
175                 rx_sg->length = ISER_RX_PAYLOAD_SIZE;
176                 rx_sg->lkey = isert_conn->conn_mr->lkey;
177         }
178
179         isert_conn->conn_rx_desc_head = 0;
180         return 0;
181
182 dma_map_fail:
183         rx_desc = isert_conn->conn_rx_descs;
184         for (j = 0; j < i; j++, rx_desc++) {
185                 ib_dma_unmap_single(ib_dev, rx_desc->dma_addr,
186                                     ISER_RX_PAYLOAD_SIZE, DMA_FROM_DEVICE);
187         }
188         kfree(isert_conn->conn_rx_descs);
189         isert_conn->conn_rx_descs = NULL;
190 fail:
191         return -ENOMEM;
192 }
193
194 static void
195 isert_free_rx_descriptors(struct isert_conn *isert_conn)
196 {
197         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
198         struct iser_rx_desc *rx_desc;
199         int i;
200
201         if (!isert_conn->conn_rx_descs)
202                 return;
203
204         rx_desc = isert_conn->conn_rx_descs;
205         for (i = 0; i < ISERT_QP_MAX_RECV_DTOS; i++, rx_desc++)  {
206                 ib_dma_unmap_single(ib_dev, rx_desc->dma_addr,
207                                     ISER_RX_PAYLOAD_SIZE, DMA_FROM_DEVICE);
208         }
209
210         kfree(isert_conn->conn_rx_descs);
211         isert_conn->conn_rx_descs = NULL;
212 }
213
/*
 * Forward declarations: per-CQ work handlers and completion callbacks that
 * isert_create_device_ib_res() registers for each RX/TX completion queue.
 */
static void isert_cq_tx_work(struct work_struct *work);
static void isert_cq_tx_callback(struct ib_cq *cq, void *context);
static void isert_cq_rx_work(struct work_struct *work);
static void isert_cq_rx_callback(struct ib_cq *cq, void *context);
218
219 static int
220 isert_create_device_ib_res(struct isert_device *device)
221 {
222         struct ib_device *ib_dev = device->ib_device;
223         struct isert_cq_desc *cq_desc;
224         struct ib_device_attr *dev_attr;
225         int ret = 0, i, j;
226         int max_rx_cqe, max_tx_cqe;
227
228         dev_attr = &device->dev_attr;
229         ret = isert_query_device(ib_dev, dev_attr);
230         if (ret)
231                 return ret;
232
233         max_rx_cqe = min(ISER_MAX_RX_CQ_LEN, dev_attr->max_cqe);
234         max_tx_cqe = min(ISER_MAX_TX_CQ_LEN, dev_attr->max_cqe);
235
236         /* asign function handlers */
237         if (dev_attr->device_cap_flags & IB_DEVICE_MEM_MGT_EXTENSIONS) {
238                 device->use_fastreg = 1;
239                 device->reg_rdma_mem = isert_reg_rdma;
240                 device->unreg_rdma_mem = isert_unreg_rdma;
241         } else {
242                 device->use_fastreg = 0;
243                 device->reg_rdma_mem = isert_map_rdma;
244                 device->unreg_rdma_mem = isert_unmap_cmd;
245         }
246
247         device->cqs_used = min_t(int, num_online_cpus(),
248                                  device->ib_device->num_comp_vectors);
249         device->cqs_used = min(ISERT_MAX_CQ, device->cqs_used);
250         pr_debug("Using %d CQs, device %s supports %d vectors support "
251                  "Fast registration %d\n",
252                  device->cqs_used, device->ib_device->name,
253                  device->ib_device->num_comp_vectors, device->use_fastreg);
254         device->cq_desc = kzalloc(sizeof(struct isert_cq_desc) *
255                                 device->cqs_used, GFP_KERNEL);
256         if (!device->cq_desc) {
257                 pr_err("Unable to allocate device->cq_desc\n");
258                 return -ENOMEM;
259         }
260         cq_desc = device->cq_desc;
261
262         for (i = 0; i < device->cqs_used; i++) {
263                 cq_desc[i].device = device;
264                 cq_desc[i].cq_index = i;
265
266                 INIT_WORK(&cq_desc[i].cq_rx_work, isert_cq_rx_work);
267                 device->dev_rx_cq[i] = ib_create_cq(device->ib_device,
268                                                 isert_cq_rx_callback,
269                                                 isert_cq_event_callback,
270                                                 (void *)&cq_desc[i],
271                                                 max_rx_cqe, i);
272                 if (IS_ERR(device->dev_rx_cq[i])) {
273                         ret = PTR_ERR(device->dev_rx_cq[i]);
274                         device->dev_rx_cq[i] = NULL;
275                         goto out_cq;
276                 }
277
278                 INIT_WORK(&cq_desc[i].cq_tx_work, isert_cq_tx_work);
279                 device->dev_tx_cq[i] = ib_create_cq(device->ib_device,
280                                                 isert_cq_tx_callback,
281                                                 isert_cq_event_callback,
282                                                 (void *)&cq_desc[i],
283                                                 max_tx_cqe, i);
284                 if (IS_ERR(device->dev_tx_cq[i])) {
285                         ret = PTR_ERR(device->dev_tx_cq[i]);
286                         device->dev_tx_cq[i] = NULL;
287                         goto out_cq;
288                 }
289
290                 ret = ib_req_notify_cq(device->dev_rx_cq[i], IB_CQ_NEXT_COMP);
291                 if (ret)
292                         goto out_cq;
293
294                 ret = ib_req_notify_cq(device->dev_tx_cq[i], IB_CQ_NEXT_COMP);
295                 if (ret)
296                         goto out_cq;
297         }
298
299         return 0;
300
301 out_cq:
302         for (j = 0; j < i; j++) {
303                 cq_desc = &device->cq_desc[j];
304
305                 if (device->dev_rx_cq[j]) {
306                         cancel_work_sync(&cq_desc->cq_rx_work);
307                         ib_destroy_cq(device->dev_rx_cq[j]);
308                 }
309                 if (device->dev_tx_cq[j]) {
310                         cancel_work_sync(&cq_desc->cq_tx_work);
311                         ib_destroy_cq(device->dev_tx_cq[j]);
312                 }
313         }
314         kfree(device->cq_desc);
315
316         return ret;
317 }
318
319 static void
320 isert_free_device_ib_res(struct isert_device *device)
321 {
322         struct isert_cq_desc *cq_desc;
323         int i;
324
325         for (i = 0; i < device->cqs_used; i++) {
326                 cq_desc = &device->cq_desc[i];
327
328                 cancel_work_sync(&cq_desc->cq_rx_work);
329                 cancel_work_sync(&cq_desc->cq_tx_work);
330                 ib_destroy_cq(device->dev_rx_cq[i]);
331                 ib_destroy_cq(device->dev_tx_cq[i]);
332                 device->dev_rx_cq[i] = NULL;
333                 device->dev_tx_cq[i] = NULL;
334         }
335
336         kfree(device->cq_desc);
337 }
338
339 static void
340 isert_device_try_release(struct isert_device *device)
341 {
342         mutex_lock(&device_list_mutex);
343         device->refcount--;
344         if (!device->refcount) {
345                 isert_free_device_ib_res(device);
346                 list_del(&device->dev_node);
347                 kfree(device);
348         }
349         mutex_unlock(&device_list_mutex);
350 }
351
352 static struct isert_device *
353 isert_device_find_by_ib_dev(struct rdma_cm_id *cma_id)
354 {
355         struct isert_device *device;
356         int ret;
357
358         mutex_lock(&device_list_mutex);
359         list_for_each_entry(device, &device_list, dev_node) {
360                 if (device->ib_device->node_guid == cma_id->device->node_guid) {
361                         device->refcount++;
362                         mutex_unlock(&device_list_mutex);
363                         return device;
364                 }
365         }
366
367         device = kzalloc(sizeof(struct isert_device), GFP_KERNEL);
368         if (!device) {
369                 mutex_unlock(&device_list_mutex);
370                 return ERR_PTR(-ENOMEM);
371         }
372
373         INIT_LIST_HEAD(&device->dev_node);
374
375         device->ib_device = cma_id->device;
376         ret = isert_create_device_ib_res(device);
377         if (ret) {
378                 kfree(device);
379                 mutex_unlock(&device_list_mutex);
380                 return ERR_PTR(ret);
381         }
382
383         device->refcount++;
384         list_add_tail(&device->dev_node, &device_list);
385         mutex_unlock(&device_list_mutex);
386
387         return device;
388 }
389
390 static void
391 isert_conn_free_fastreg_pool(struct isert_conn *isert_conn)
392 {
393         struct fast_reg_descriptor *fr_desc, *tmp;
394         int i = 0;
395
396         if (list_empty(&isert_conn->conn_fr_pool))
397                 return;
398
399         pr_debug("Freeing conn %p fastreg pool", isert_conn);
400
401         list_for_each_entry_safe(fr_desc, tmp,
402                                  &isert_conn->conn_fr_pool, list) {
403                 list_del(&fr_desc->list);
404                 ib_free_fast_reg_page_list(fr_desc->data_frpl);
405                 ib_dereg_mr(fr_desc->data_mr);
406                 kfree(fr_desc);
407                 ++i;
408         }
409
410         if (i < isert_conn->conn_fr_pool_size)
411                 pr_warn("Pool still has %d regions registered\n",
412                         isert_conn->conn_fr_pool_size - i);
413 }
414
415 static int
416 isert_create_fr_desc(struct ib_device *ib_device, struct ib_pd *pd,
417                      struct fast_reg_descriptor *fr_desc)
418 {
419         fr_desc->data_frpl = ib_alloc_fast_reg_page_list(ib_device,
420                                                          ISCSI_ISER_SG_TABLESIZE);
421         if (IS_ERR(fr_desc->data_frpl)) {
422                 pr_err("Failed to allocate data frpl err=%ld\n",
423                        PTR_ERR(fr_desc->data_frpl));
424                 return PTR_ERR(fr_desc->data_frpl);
425         }
426
427         fr_desc->data_mr = ib_alloc_fast_reg_mr(pd, ISCSI_ISER_SG_TABLESIZE);
428         if (IS_ERR(fr_desc->data_mr)) {
429                 pr_err("Failed to allocate data frmr err=%ld\n",
430                        PTR_ERR(fr_desc->data_mr));
431                 ib_free_fast_reg_page_list(fr_desc->data_frpl);
432                 return PTR_ERR(fr_desc->data_mr);
433         }
434         pr_debug("Create fr_desc %p page_list %p\n",
435                  fr_desc, fr_desc->data_frpl->page_list);
436
437         fr_desc->valid = true;
438
439         return 0;
440 }
441
442 static int
443 isert_conn_create_fastreg_pool(struct isert_conn *isert_conn)
444 {
445         struct fast_reg_descriptor *fr_desc;
446         struct isert_device *device = isert_conn->conn_device;
447         struct se_session *se_sess = isert_conn->conn->sess->se_sess;
448         struct se_node_acl *se_nacl = se_sess->se_node_acl;
449         int i, ret, tag_num;
450         /*
451          * Setup the number of FRMRs based upon the number of tags
452          * available to session in iscsi_target_locate_portal().
453          */
454         tag_num = max_t(u32, ISCSIT_MIN_TAGS, se_nacl->queue_depth);
455         tag_num = (tag_num * 2) + ISCSIT_EXTRA_TAGS;
456
457         isert_conn->conn_fr_pool_size = 0;
458         for (i = 0; i < tag_num; i++) {
459                 fr_desc = kzalloc(sizeof(*fr_desc), GFP_KERNEL);
460                 if (!fr_desc) {
461                         pr_err("Failed to allocate fast_reg descriptor\n");
462                         ret = -ENOMEM;
463                         goto err;
464                 }
465
466                 ret = isert_create_fr_desc(device->ib_device,
467                                            isert_conn->conn_pd, fr_desc);
468                 if (ret) {
469                         pr_err("Failed to create fastreg descriptor err=%d\n",
470                                ret);
471                         kfree(fr_desc);
472                         goto err;
473                 }
474
475                 list_add_tail(&fr_desc->list, &isert_conn->conn_fr_pool);
476                 isert_conn->conn_fr_pool_size++;
477         }
478
479         pr_debug("Creating conn %p fastreg pool size=%d",
480                  isert_conn, isert_conn->conn_fr_pool_size);
481
482         return 0;
483
484 err:
485         isert_conn_free_fastreg_pool(isert_conn);
486         return ret;
487 }
488
489 static int
490 isert_connect_request(struct rdma_cm_id *cma_id, struct rdma_cm_event *event)
491 {
492         struct iscsi_np *np = cma_id->context;
493         struct isert_np *isert_np = np->np_context;
494         struct isert_conn *isert_conn;
495         struct isert_device *device;
496         struct ib_device *ib_dev = cma_id->device;
497         int ret = 0;
498
499         spin_lock_bh(&np->np_thread_lock);
500         if (!np->enabled) {
501                 spin_unlock_bh(&np->np_thread_lock);
502                 pr_debug("iscsi_np is not enabled, reject connect request\n");
503                 return rdma_reject(cma_id, NULL, 0);
504         }
505         spin_unlock_bh(&np->np_thread_lock);
506
507         pr_debug("Entering isert_connect_request cma_id: %p, context: %p\n",
508                  cma_id, cma_id->context);
509
510         isert_conn = kzalloc(sizeof(struct isert_conn), GFP_KERNEL);
511         if (!isert_conn) {
512                 pr_err("Unable to allocate isert_conn\n");
513                 return -ENOMEM;
514         }
515         isert_conn->state = ISER_CONN_INIT;
516         INIT_LIST_HEAD(&isert_conn->conn_accept_node);
517         init_completion(&isert_conn->conn_login_comp);
518         init_completion(&isert_conn->conn_wait);
519         init_completion(&isert_conn->conn_wait_comp_err);
520         kref_init(&isert_conn->conn_kref);
521         mutex_init(&isert_conn->conn_mutex);
522         spin_lock_init(&isert_conn->conn_lock);
523         INIT_LIST_HEAD(&isert_conn->conn_fr_pool);
524
525         cma_id->context = isert_conn;
526         isert_conn->conn_cm_id = cma_id;
527         isert_conn->responder_resources = event->param.conn.responder_resources;
528         isert_conn->initiator_depth = event->param.conn.initiator_depth;
529         pr_debug("Using responder_resources: %u initiator_depth: %u\n",
530                  isert_conn->responder_resources, isert_conn->initiator_depth);
531
532         isert_conn->login_buf = kzalloc(ISCSI_DEF_MAX_RECV_SEG_LEN +
533                                         ISER_RX_LOGIN_SIZE, GFP_KERNEL);
534         if (!isert_conn->login_buf) {
535                 pr_err("Unable to allocate isert_conn->login_buf\n");
536                 ret = -ENOMEM;
537                 goto out;
538         }
539
540         isert_conn->login_req_buf = isert_conn->login_buf;
541         isert_conn->login_rsp_buf = isert_conn->login_buf +
542                                     ISCSI_DEF_MAX_RECV_SEG_LEN;
543         pr_debug("Set login_buf: %p login_req_buf: %p login_rsp_buf: %p\n",
544                  isert_conn->login_buf, isert_conn->login_req_buf,
545                  isert_conn->login_rsp_buf);
546
547         isert_conn->login_req_dma = ib_dma_map_single(ib_dev,
548                                 (void *)isert_conn->login_req_buf,
549                                 ISCSI_DEF_MAX_RECV_SEG_LEN, DMA_FROM_DEVICE);
550
551         ret = ib_dma_mapping_error(ib_dev, isert_conn->login_req_dma);
552         if (ret) {
553                 pr_err("ib_dma_mapping_error failed for login_req_dma: %d\n",
554                        ret);
555                 isert_conn->login_req_dma = 0;
556                 goto out_login_buf;
557         }
558
559         isert_conn->login_rsp_dma = ib_dma_map_single(ib_dev,
560                                         (void *)isert_conn->login_rsp_buf,
561                                         ISER_RX_LOGIN_SIZE, DMA_TO_DEVICE);
562
563         ret = ib_dma_mapping_error(ib_dev, isert_conn->login_rsp_dma);
564         if (ret) {
565                 pr_err("ib_dma_mapping_error failed for login_rsp_dma: %d\n",
566                        ret);
567                 isert_conn->login_rsp_dma = 0;
568                 goto out_req_dma_map;
569         }
570
571         device = isert_device_find_by_ib_dev(cma_id);
572         if (IS_ERR(device)) {
573                 ret = PTR_ERR(device);
574                 goto out_rsp_dma_map;
575         }
576
577         isert_conn->conn_device = device;
578         isert_conn->conn_pd = ib_alloc_pd(isert_conn->conn_device->ib_device);
579         if (IS_ERR(isert_conn->conn_pd)) {
580                 ret = PTR_ERR(isert_conn->conn_pd);
581                 pr_err("ib_alloc_pd failed for conn %p: ret=%d\n",
582                        isert_conn, ret);
583                 goto out_pd;
584         }
585
586         isert_conn->conn_mr = ib_get_dma_mr(isert_conn->conn_pd,
587                                            IB_ACCESS_LOCAL_WRITE);
588         if (IS_ERR(isert_conn->conn_mr)) {
589                 ret = PTR_ERR(isert_conn->conn_mr);
590                 pr_err("ib_get_dma_mr failed for conn %p: ret=%d\n",
591                        isert_conn, ret);
592                 goto out_mr;
593         }
594
595         ret = isert_conn_setup_qp(isert_conn, cma_id);
596         if (ret)
597                 goto out_conn_dev;
598
599         mutex_lock(&isert_np->np_accept_mutex);
600         list_add_tail(&isert_conn->conn_accept_node, &isert_np->np_accept_list);
601         mutex_unlock(&isert_np->np_accept_mutex);
602
603         pr_debug("isert_connect_request() up np_sem np: %p\n", np);
604         up(&isert_np->np_sem);
605         return 0;
606
607 out_conn_dev:
608         ib_dereg_mr(isert_conn->conn_mr);
609 out_mr:
610         ib_dealloc_pd(isert_conn->conn_pd);
611 out_pd:
612         isert_device_try_release(device);
613 out_rsp_dma_map:
614         ib_dma_unmap_single(ib_dev, isert_conn->login_rsp_dma,
615                             ISER_RX_LOGIN_SIZE, DMA_TO_DEVICE);
616 out_req_dma_map:
617         ib_dma_unmap_single(ib_dev, isert_conn->login_req_dma,
618                             ISCSI_DEF_MAX_RECV_SEG_LEN, DMA_FROM_DEVICE);
619 out_login_buf:
620         kfree(isert_conn->login_buf);
621 out:
622         kfree(isert_conn);
623         return ret;
624 }
625
626 static void
627 isert_connect_release(struct isert_conn *isert_conn)
628 {
629         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
630         struct isert_device *device = isert_conn->conn_device;
631         int cq_index;
632
633         pr_debug("Entering isert_connect_release(): >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>\n");
634
635         if (device && device->use_fastreg)
636                 isert_conn_free_fastreg_pool(isert_conn);
637
638         if (isert_conn->conn_qp) {
639                 cq_index = ((struct isert_cq_desc *)
640                         isert_conn->conn_qp->recv_cq->cq_context)->cq_index;
641                 pr_debug("isert_connect_release: cq_index: %d\n", cq_index);
642                 isert_conn->conn_device->cq_active_qps[cq_index]--;
643
644                 rdma_destroy_qp(isert_conn->conn_cm_id);
645         }
646
647         isert_free_rx_descriptors(isert_conn);
648         rdma_destroy_id(isert_conn->conn_cm_id);
649
650         ib_dereg_mr(isert_conn->conn_mr);
651         ib_dealloc_pd(isert_conn->conn_pd);
652
653         if (isert_conn->login_buf) {
654                 ib_dma_unmap_single(ib_dev, isert_conn->login_rsp_dma,
655                                     ISER_RX_LOGIN_SIZE, DMA_TO_DEVICE);
656                 ib_dma_unmap_single(ib_dev, isert_conn->login_req_dma,
657                                     ISCSI_DEF_MAX_RECV_SEG_LEN,
658                                     DMA_FROM_DEVICE);
659                 kfree(isert_conn->login_buf);
660         }
661         kfree(isert_conn);
662
663         if (device)
664                 isert_device_try_release(device);
665
666         pr_debug("Leaving isert_connect_release >>>>>>>>>>>>\n");
667 }
668
669 static void
670 isert_connected_handler(struct rdma_cm_id *cma_id)
671 {
672         struct isert_conn *isert_conn = cma_id->context;
673
674         kref_get(&isert_conn->conn_kref);
675 }
676
677 static void
678 isert_release_conn_kref(struct kref *kref)
679 {
680         struct isert_conn *isert_conn = container_of(kref,
681                                 struct isert_conn, conn_kref);
682
683         pr_debug("Calling isert_connect_release for final kref %s/%d\n",
684                  current->comm, current->pid);
685
686         isert_connect_release(isert_conn);
687 }
688
689 static void
690 isert_put_conn(struct isert_conn *isert_conn)
691 {
692         kref_put(&isert_conn->conn_kref, isert_release_conn_kref);
693 }
694
695 static void
696 isert_disconnect_work(struct work_struct *work)
697 {
698         struct isert_conn *isert_conn = container_of(work,
699                                 struct isert_conn, conn_logout_work);
700
701         pr_debug("isert_disconnect_work(): >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>\n");
702         mutex_lock(&isert_conn->conn_mutex);
703         if (isert_conn->state == ISER_CONN_UP)
704                 isert_conn->state = ISER_CONN_TERMINATING;
705
706         if (isert_conn->post_recv_buf_count == 0 &&
707             atomic_read(&isert_conn->post_send_buf_count) == 0) {
708                 mutex_unlock(&isert_conn->conn_mutex);
709                 goto wake_up;
710         }
711         if (!isert_conn->conn_cm_id) {
712                 mutex_unlock(&isert_conn->conn_mutex);
713                 isert_put_conn(isert_conn);
714                 return;
715         }
716
717         if (isert_conn->disconnect) {
718                 /* Send DREQ/DREP towards our initiator */
719                 rdma_disconnect(isert_conn->conn_cm_id);
720         }
721
722         mutex_unlock(&isert_conn->conn_mutex);
723
724 wake_up:
725         complete(&isert_conn->conn_wait);
726 }
727
728 static void
729 isert_disconnected_handler(struct rdma_cm_id *cma_id, bool disconnect)
730 {
731         struct isert_conn *isert_conn = (struct isert_conn *)cma_id->context;
732
733         isert_conn->disconnect = disconnect;
734         INIT_WORK(&isert_conn->conn_logout_work, isert_disconnect_work);
735         schedule_work(&isert_conn->conn_logout_work);
736 }
737
738 static int
739 isert_cma_handler(struct rdma_cm_id *cma_id, struct rdma_cm_event *event)
740 {
741         int ret = 0;
742         bool disconnect = false;
743
744         pr_debug("isert_cma_handler: event %d status %d conn %p id %p\n",
745                  event->event, event->status, cma_id->context, cma_id);
746
747         switch (event->event) {
748         case RDMA_CM_EVENT_CONNECT_REQUEST:
749                 ret = isert_connect_request(cma_id, event);
750                 break;
751         case RDMA_CM_EVENT_ESTABLISHED:
752                 isert_connected_handler(cma_id);
753                 break;
754         case RDMA_CM_EVENT_ADDR_CHANGE:    /* FALLTHRU */
755         case RDMA_CM_EVENT_DISCONNECTED:   /* FALLTHRU */
756         case RDMA_CM_EVENT_DEVICE_REMOVAL: /* FALLTHRU */
757                 disconnect = true;
758         case RDMA_CM_EVENT_TIMEWAIT_EXIT:  /* FALLTHRU */
759                 isert_disconnected_handler(cma_id, disconnect);
760                 break;
761         case RDMA_CM_EVENT_CONNECT_ERROR:
762         default:
763                 pr_err("Unhandled RDMA CMA event: %d\n", event->event);
764                 break;
765         }
766
767         if (ret != 0) {
768                 pr_err("isert_cma_handler failed RDMA_CM_EVENT: 0x%08x %d\n",
769                        event->event, ret);
770                 dump_stack();
771         }
772
773         return ret;
774 }
775
776 static int
777 isert_post_recv(struct isert_conn *isert_conn, u32 count)
778 {
779         struct ib_recv_wr *rx_wr, *rx_wr_failed;
780         int i, ret;
781         unsigned int rx_head = isert_conn->conn_rx_desc_head;
782         struct iser_rx_desc *rx_desc;
783
784         for (rx_wr = isert_conn->conn_rx_wr, i = 0; i < count; i++, rx_wr++) {
785                 rx_desc         = &isert_conn->conn_rx_descs[rx_head];
786                 rx_wr->wr_id    = (unsigned long)rx_desc;
787                 rx_wr->sg_list  = &rx_desc->rx_sg;
788                 rx_wr->num_sge  = 1;
789                 rx_wr->next     = rx_wr + 1;
790                 rx_head = (rx_head + 1) & (ISERT_QP_MAX_RECV_DTOS - 1);
791         }
792
793         rx_wr--;
794         rx_wr->next = NULL; /* mark end of work requests list */
795
796         isert_conn->post_recv_buf_count += count;
797         ret = ib_post_recv(isert_conn->conn_qp, isert_conn->conn_rx_wr,
798                                 &rx_wr_failed);
799         if (ret) {
800                 pr_err("ib_post_recv() failed with ret: %d\n", ret);
801                 isert_conn->post_recv_buf_count -= count;
802         } else {
803                 pr_debug("isert_post_recv(): Posted %d RX buffers\n", count);
804                 isert_conn->conn_rx_desc_head = rx_head;
805         }
806         return ret;
807 }
808
809 static int
810 isert_post_send(struct isert_conn *isert_conn, struct iser_tx_desc *tx_desc)
811 {
812         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
813         struct ib_send_wr send_wr, *send_wr_failed;
814         int ret;
815
816         ib_dma_sync_single_for_device(ib_dev, tx_desc->dma_addr,
817                                       ISER_HEADERS_LEN, DMA_TO_DEVICE);
818
819         send_wr.next    = NULL;
820         send_wr.wr_id   = (unsigned long)tx_desc;
821         send_wr.sg_list = tx_desc->tx_sg;
822         send_wr.num_sge = tx_desc->num_sge;
823         send_wr.opcode  = IB_WR_SEND;
824         send_wr.send_flags = IB_SEND_SIGNALED;
825
826         atomic_inc(&isert_conn->post_send_buf_count);
827
828         ret = ib_post_send(isert_conn->conn_qp, &send_wr, &send_wr_failed);
829         if (ret) {
830                 pr_err("ib_post_send() failed, ret: %d\n", ret);
831                 atomic_dec(&isert_conn->post_send_buf_count);
832         }
833
834         return ret;
835 }
836
837 static void
838 isert_create_send_desc(struct isert_conn *isert_conn,
839                        struct isert_cmd *isert_cmd,
840                        struct iser_tx_desc *tx_desc)
841 {
842         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
843
844         ib_dma_sync_single_for_cpu(ib_dev, tx_desc->dma_addr,
845                                    ISER_HEADERS_LEN, DMA_TO_DEVICE);
846
847         memset(&tx_desc->iser_header, 0, sizeof(struct iser_hdr));
848         tx_desc->iser_header.flags = ISER_VER;
849
850         tx_desc->num_sge = 1;
851         tx_desc->isert_cmd = isert_cmd;
852
853         if (tx_desc->tx_sg[0].lkey != isert_conn->conn_mr->lkey) {
854                 tx_desc->tx_sg[0].lkey = isert_conn->conn_mr->lkey;
855                 pr_debug("tx_desc %p lkey mismatch, fixing\n", tx_desc);
856         }
857 }
858
859 static int
860 isert_init_tx_hdrs(struct isert_conn *isert_conn,
861                    struct iser_tx_desc *tx_desc)
862 {
863         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
864         u64 dma_addr;
865
866         dma_addr = ib_dma_map_single(ib_dev, (void *)tx_desc,
867                         ISER_HEADERS_LEN, DMA_TO_DEVICE);
868         if (ib_dma_mapping_error(ib_dev, dma_addr)) {
869                 pr_err("ib_dma_mapping_error() failed\n");
870                 return -ENOMEM;
871         }
872
873         tx_desc->dma_addr = dma_addr;
874         tx_desc->tx_sg[0].addr  = tx_desc->dma_addr;
875         tx_desc->tx_sg[0].length = ISER_HEADERS_LEN;
876         tx_desc->tx_sg[0].lkey = isert_conn->conn_mr->lkey;
877
878         pr_debug("isert_init_tx_hdrs: Setup tx_sg[0].addr: 0x%llx length: %u"
879                  " lkey: 0x%08x\n", tx_desc->tx_sg[0].addr,
880                  tx_desc->tx_sg[0].length, tx_desc->tx_sg[0].lkey);
881
882         return 0;
883 }
884
885 static void
886 isert_init_send_wr(struct isert_conn *isert_conn, struct isert_cmd *isert_cmd,
887                    struct ib_send_wr *send_wr, bool coalesce)
888 {
889         struct iser_tx_desc *tx_desc = &isert_cmd->tx_desc;
890
891         isert_cmd->rdma_wr.iser_ib_op = ISER_IB_SEND;
892         send_wr->wr_id = (unsigned long)&isert_cmd->tx_desc;
893         send_wr->opcode = IB_WR_SEND;
894         send_wr->sg_list = &tx_desc->tx_sg[0];
895         send_wr->num_sge = isert_cmd->tx_desc.num_sge;
896         /*
897          * Coalesce send completion interrupts by only setting IB_SEND_SIGNALED
898          * bit for every ISERT_COMP_BATCH_COUNT number of ib_post_send() calls.
899          */
900         mutex_lock(&isert_conn->conn_mutex);
901         if (coalesce && isert_conn->state == ISER_CONN_UP &&
902             ++isert_conn->conn_comp_batch < ISERT_COMP_BATCH_COUNT) {
903                 tx_desc->llnode_active = true;
904                 llist_add(&tx_desc->comp_llnode, &isert_conn->conn_comp_llist);
905                 mutex_unlock(&isert_conn->conn_mutex);
906                 return;
907         }
908         isert_conn->conn_comp_batch = 0;
909         tx_desc->comp_llnode_batch = llist_del_all(&isert_conn->conn_comp_llist);
910         mutex_unlock(&isert_conn->conn_mutex);
911
912         send_wr->send_flags = IB_SEND_SIGNALED;
913 }
914
915 static int
916 isert_rdma_post_recvl(struct isert_conn *isert_conn)
917 {
918         struct ib_recv_wr rx_wr, *rx_wr_fail;
919         struct ib_sge sge;
920         int ret;
921
922         memset(&sge, 0, sizeof(struct ib_sge));
923         sge.addr = isert_conn->login_req_dma;
924         sge.length = ISER_RX_LOGIN_SIZE;
925         sge.lkey = isert_conn->conn_mr->lkey;
926
927         pr_debug("Setup sge: addr: %llx length: %d 0x%08x\n",
928                 sge.addr, sge.length, sge.lkey);
929
930         memset(&rx_wr, 0, sizeof(struct ib_recv_wr));
931         rx_wr.wr_id = (unsigned long)isert_conn->login_req_buf;
932         rx_wr.sg_list = &sge;
933         rx_wr.num_sge = 1;
934
935         isert_conn->post_recv_buf_count++;
936         ret = ib_post_recv(isert_conn->conn_qp, &rx_wr, &rx_wr_fail);
937         if (ret) {
938                 pr_err("ib_post_recv() failed: %d\n", ret);
939                 isert_conn->post_recv_buf_count--;
940         }
941
942         pr_debug("ib_post_recv(): returned success >>>>>>>>>>>>>>>>>>>>>>>>\n");
943         return ret;
944 }
945
946 static int
947 isert_put_login_tx(struct iscsi_conn *conn, struct iscsi_login *login,
948                    u32 length)
949 {
950         struct isert_conn *isert_conn = conn->context;
951         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
952         struct iser_tx_desc *tx_desc = &isert_conn->conn_login_tx_desc;
953         int ret;
954
955         isert_create_send_desc(isert_conn, NULL, tx_desc);
956
957         memcpy(&tx_desc->iscsi_header, &login->rsp[0],
958                sizeof(struct iscsi_hdr));
959
960         isert_init_tx_hdrs(isert_conn, tx_desc);
961
962         if (length > 0) {
963                 struct ib_sge *tx_dsg = &tx_desc->tx_sg[1];
964
965                 ib_dma_sync_single_for_cpu(ib_dev, isert_conn->login_rsp_dma,
966                                            length, DMA_TO_DEVICE);
967
968                 memcpy(isert_conn->login_rsp_buf, login->rsp_buf, length);
969
970                 ib_dma_sync_single_for_device(ib_dev, isert_conn->login_rsp_dma,
971                                               length, DMA_TO_DEVICE);
972
973                 tx_dsg->addr    = isert_conn->login_rsp_dma;
974                 tx_dsg->length  = length;
975                 tx_dsg->lkey    = isert_conn->conn_mr->lkey;
976                 tx_desc->num_sge = 2;
977         }
978         if (!login->login_failed) {
979                 if (login->login_complete) {
980                         if (isert_conn->conn_device->use_fastreg) {
981                                 ret = isert_conn_create_fastreg_pool(isert_conn);
982                                 if (ret) {
983                                         pr_err("Conn: %p failed to create"
984                                                " fastreg pool\n", isert_conn);
985                                         return ret;
986                                 }
987                         }
988
989                         ret = isert_alloc_rx_descriptors(isert_conn);
990                         if (ret)
991                                 return ret;
992
993                         ret = isert_post_recv(isert_conn, ISERT_MIN_POSTED_RX);
994                         if (ret)
995                                 return ret;
996
997                         isert_conn->state = ISER_CONN_UP;
998                         goto post_send;
999                 }
1000
1001                 ret = isert_rdma_post_recvl(isert_conn);
1002                 if (ret)
1003                         return ret;
1004         }
1005 post_send:
1006         ret = isert_post_send(isert_conn, tx_desc);
1007         if (ret)
1008                 return ret;
1009
1010         return 0;
1011 }
1012
1013 static void
1014 isert_rx_login_req(struct iser_rx_desc *rx_desc, int rx_buflen,
1015                    struct isert_conn *isert_conn)
1016 {
1017         struct iscsi_conn *conn = isert_conn->conn;
1018         struct iscsi_login *login = conn->conn_login;
1019         int size;
1020
1021         if (!login) {
1022                 pr_err("conn->conn_login is NULL\n");
1023                 dump_stack();
1024                 return;
1025         }
1026
1027         if (login->first_request) {
1028                 struct iscsi_login_req *login_req =
1029                         (struct iscsi_login_req *)&rx_desc->iscsi_header;
1030                 /*
1031                  * Setup the initial iscsi_login values from the leading
1032                  * login request PDU.
1033                  */
1034                 login->leading_connection = (!login_req->tsih) ? 1 : 0;
1035                 login->current_stage =
1036                         (login_req->flags & ISCSI_FLAG_LOGIN_CURRENT_STAGE_MASK)
1037                          >> 2;
1038                 login->version_min      = login_req->min_version;
1039                 login->version_max      = login_req->max_version;
1040                 memcpy(login->isid, login_req->isid, 6);
1041                 login->cmd_sn           = be32_to_cpu(login_req->cmdsn);
1042                 login->init_task_tag    = login_req->itt;
1043                 login->initial_exp_statsn = be32_to_cpu(login_req->exp_statsn);
1044                 login->cid              = be16_to_cpu(login_req->cid);
1045                 login->tsih             = be16_to_cpu(login_req->tsih);
1046         }
1047
1048         memcpy(&login->req[0], (void *)&rx_desc->iscsi_header, ISCSI_HDR_LEN);
1049
1050         size = min(rx_buflen, MAX_KEY_VALUE_PAIRS);
1051         pr_debug("Using login payload size: %d, rx_buflen: %d MAX_KEY_VALUE_PAIRS: %d\n",
1052                  size, rx_buflen, MAX_KEY_VALUE_PAIRS);
1053         memcpy(login->req_buf, &rx_desc->data[0], size);
1054
1055         if (login->first_request) {
1056                 complete(&isert_conn->conn_login_comp);
1057                 return;
1058         }
1059         schedule_delayed_work(&conn->login_work, 0);
1060 }
1061
1062 static struct iscsi_cmd
1063 *isert_allocate_cmd(struct iscsi_conn *conn)
1064 {
1065         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
1066         struct isert_cmd *isert_cmd;
1067         struct iscsi_cmd *cmd;
1068
1069         cmd = iscsit_allocate_cmd(conn, TASK_INTERRUPTIBLE);
1070         if (!cmd) {
1071                 pr_err("Unable to allocate iscsi_cmd + isert_cmd\n");
1072                 return NULL;
1073         }
1074         isert_cmd = iscsit_priv_cmd(cmd);
1075         isert_cmd->conn = isert_conn;
1076         isert_cmd->iscsi_cmd = cmd;
1077
1078         return cmd;
1079 }
1080
1081 static int
1082 isert_handle_scsi_cmd(struct isert_conn *isert_conn,
1083                       struct isert_cmd *isert_cmd, struct iscsi_cmd *cmd,
1084                       struct iser_rx_desc *rx_desc, unsigned char *buf)
1085 {
1086         struct iscsi_conn *conn = isert_conn->conn;
1087         struct iscsi_scsi_req *hdr = (struct iscsi_scsi_req *)buf;
1088         struct scatterlist *sg;
1089         int imm_data, imm_data_len, unsol_data, sg_nents, rc;
1090         bool dump_payload = false;
1091
1092         rc = iscsit_setup_scsi_cmd(conn, cmd, buf);
1093         if (rc < 0)
1094                 return rc;
1095
1096         imm_data = cmd->immediate_data;
1097         imm_data_len = cmd->first_burst_len;
1098         unsol_data = cmd->unsolicited_data;
1099
1100         rc = iscsit_process_scsi_cmd(conn, cmd, hdr);
1101         if (rc < 0) {
1102                 return 0;
1103         } else if (rc > 0) {
1104                 dump_payload = true;
1105                 goto sequence_cmd;
1106         }
1107
1108         if (!imm_data)
1109                 return 0;
1110
1111         sg = &cmd->se_cmd.t_data_sg[0];
1112         sg_nents = max(1UL, DIV_ROUND_UP(imm_data_len, PAGE_SIZE));
1113
1114         pr_debug("Copying Immediate SG: %p sg_nents: %u from %p imm_data_len: %d\n",
1115                  sg, sg_nents, &rx_desc->data[0], imm_data_len);
1116
1117         sg_copy_from_buffer(sg, sg_nents, &rx_desc->data[0], imm_data_len);
1118
1119         cmd->write_data_done += imm_data_len;
1120
1121         if (cmd->write_data_done == cmd->se_cmd.data_length) {
1122                 spin_lock_bh(&cmd->istate_lock);
1123                 cmd->cmd_flags |= ICF_GOT_LAST_DATAOUT;
1124                 cmd->i_state = ISTATE_RECEIVED_LAST_DATAOUT;
1125                 spin_unlock_bh(&cmd->istate_lock);
1126         }
1127
1128 sequence_cmd:
1129         rc = iscsit_sequence_cmd(conn, cmd, buf, hdr->cmdsn);
1130
1131         if (!rc && dump_payload == false && unsol_data)
1132                 iscsit_set_unsoliticed_dataout(cmd);
1133         else if (dump_payload && imm_data)
1134                 target_put_sess_cmd(conn->sess->se_sess, &cmd->se_cmd);
1135
1136         return 0;
1137 }
1138
1139 static int
1140 isert_handle_iscsi_dataout(struct isert_conn *isert_conn,
1141                            struct iser_rx_desc *rx_desc, unsigned char *buf)
1142 {
1143         struct scatterlist *sg_start;
1144         struct iscsi_conn *conn = isert_conn->conn;
1145         struct iscsi_cmd *cmd = NULL;
1146         struct iscsi_data *hdr = (struct iscsi_data *)buf;
1147         u32 unsol_data_len = ntoh24(hdr->dlength);
1148         int rc, sg_nents, sg_off, page_off;
1149
1150         rc = iscsit_check_dataout_hdr(conn, buf, &cmd);
1151         if (rc < 0)
1152                 return rc;
1153         else if (!cmd)
1154                 return 0;
1155         /*
1156          * FIXME: Unexpected unsolicited_data out
1157          */
1158         if (!cmd->unsolicited_data) {
1159                 pr_err("Received unexpected solicited data payload\n");
1160                 dump_stack();
1161                 return -1;
1162         }
1163
1164         pr_debug("Unsolicited DataOut unsol_data_len: %u, write_data_done: %u, data_length: %u\n",
1165                  unsol_data_len, cmd->write_data_done, cmd->se_cmd.data_length);
1166
1167         sg_off = cmd->write_data_done / PAGE_SIZE;
1168         sg_start = &cmd->se_cmd.t_data_sg[sg_off];
1169         sg_nents = max(1UL, DIV_ROUND_UP(unsol_data_len, PAGE_SIZE));
1170         page_off = cmd->write_data_done % PAGE_SIZE;
1171         /*
1172          * FIXME: Non page-aligned unsolicited_data out
1173          */
1174         if (page_off) {
1175                 pr_err("Received unexpected non-page aligned data payload\n");
1176                 dump_stack();
1177                 return -1;
1178         }
1179         pr_debug("Copying DataOut: sg_start: %p, sg_off: %u sg_nents: %u from %p %u\n",
1180                  sg_start, sg_off, sg_nents, &rx_desc->data[0], unsol_data_len);
1181
1182         sg_copy_from_buffer(sg_start, sg_nents, &rx_desc->data[0],
1183                             unsol_data_len);
1184
1185         rc = iscsit_check_dataout_payload(cmd, hdr, false);
1186         if (rc < 0)
1187                 return rc;
1188
1189         return 0;
1190 }
1191
1192 static int
1193 isert_handle_nop_out(struct isert_conn *isert_conn, struct isert_cmd *isert_cmd,
1194                      struct iscsi_cmd *cmd, struct iser_rx_desc *rx_desc,
1195                      unsigned char *buf)
1196 {
1197         struct iscsi_conn *conn = isert_conn->conn;
1198         struct iscsi_nopout *hdr = (struct iscsi_nopout *)buf;
1199         int rc;
1200
1201         rc = iscsit_setup_nop_out(conn, cmd, hdr);
1202         if (rc < 0)
1203                 return rc;
1204         /*
1205          * FIXME: Add support for NOPOUT payload using unsolicited RDMA payload
1206          */
1207
1208         return iscsit_process_nop_out(conn, cmd, hdr);
1209 }
1210
1211 static int
1212 isert_handle_text_cmd(struct isert_conn *isert_conn, struct isert_cmd *isert_cmd,
1213                       struct iscsi_cmd *cmd, struct iser_rx_desc *rx_desc,
1214                       struct iscsi_text *hdr)
1215 {
1216         struct iscsi_conn *conn = isert_conn->conn;
1217         u32 payload_length = ntoh24(hdr->dlength);
1218         int rc;
1219         unsigned char *text_in;
1220
1221         rc = iscsit_setup_text_cmd(conn, cmd, hdr);
1222         if (rc < 0)
1223                 return rc;
1224
1225         text_in = kzalloc(payload_length, GFP_KERNEL);
1226         if (!text_in) {
1227                 pr_err("Unable to allocate text_in of payload_length: %u\n",
1228                        payload_length);
1229                 return -ENOMEM;
1230         }
1231         cmd->text_in_ptr = text_in;
1232
1233         memcpy(cmd->text_in_ptr, &rx_desc->data[0], payload_length);
1234
1235         return iscsit_process_text_cmd(conn, cmd, hdr);
1236 }
1237
1238 static int
1239 isert_rx_opcode(struct isert_conn *isert_conn, struct iser_rx_desc *rx_desc,
1240                 uint32_t read_stag, uint64_t read_va,
1241                 uint32_t write_stag, uint64_t write_va)
1242 {
1243         struct iscsi_hdr *hdr = &rx_desc->iscsi_header;
1244         struct iscsi_conn *conn = isert_conn->conn;
1245         struct iscsi_session *sess = conn->sess;
1246         struct iscsi_cmd *cmd;
1247         struct isert_cmd *isert_cmd;
1248         int ret = -EINVAL;
1249         u8 opcode = (hdr->opcode & ISCSI_OPCODE_MASK);
1250
1251         if (sess->sess_ops->SessionType &&
1252            (!(opcode & ISCSI_OP_TEXT) || !(opcode & ISCSI_OP_LOGOUT))) {
1253                 pr_err("Got illegal opcode: 0x%02x in SessionType=Discovery,"
1254                        " ignoring\n", opcode);
1255                 return 0;
1256         }
1257
1258         switch (opcode) {
1259         case ISCSI_OP_SCSI_CMD:
1260                 cmd = isert_allocate_cmd(conn);
1261                 if (!cmd)
1262                         break;
1263
1264                 isert_cmd = iscsit_priv_cmd(cmd);
1265                 isert_cmd->read_stag = read_stag;
1266                 isert_cmd->read_va = read_va;
1267                 isert_cmd->write_stag = write_stag;
1268                 isert_cmd->write_va = write_va;
1269
1270                 ret = isert_handle_scsi_cmd(isert_conn, isert_cmd, cmd,
1271                                         rx_desc, (unsigned char *)hdr);
1272                 break;
1273         case ISCSI_OP_NOOP_OUT:
1274                 cmd = isert_allocate_cmd(conn);
1275                 if (!cmd)
1276                         break;
1277
1278                 isert_cmd = iscsit_priv_cmd(cmd);
1279                 ret = isert_handle_nop_out(isert_conn, isert_cmd, cmd,
1280                                            rx_desc, (unsigned char *)hdr);
1281                 break;
1282         case ISCSI_OP_SCSI_DATA_OUT:
1283                 ret = isert_handle_iscsi_dataout(isert_conn, rx_desc,
1284                                                 (unsigned char *)hdr);
1285                 break;
1286         case ISCSI_OP_SCSI_TMFUNC:
1287                 cmd = isert_allocate_cmd(conn);
1288                 if (!cmd)
1289                         break;
1290
1291                 ret = iscsit_handle_task_mgt_cmd(conn, cmd,
1292                                                 (unsigned char *)hdr);
1293                 break;
1294         case ISCSI_OP_LOGOUT:
1295                 cmd = isert_allocate_cmd(conn);
1296                 if (!cmd)
1297                         break;
1298
1299                 ret = iscsit_handle_logout_cmd(conn, cmd, (unsigned char *)hdr);
1300                 if (ret > 0)
1301                         wait_for_completion_timeout(&conn->conn_logout_comp,
1302                                                     SECONDS_FOR_LOGOUT_COMP *
1303                                                     HZ);
1304                 break;
1305         case ISCSI_OP_TEXT:
1306                 cmd = isert_allocate_cmd(conn);
1307                 if (!cmd)
1308                         break;
1309
1310                 isert_cmd = iscsit_priv_cmd(cmd);
1311                 ret = isert_handle_text_cmd(isert_conn, isert_cmd, cmd,
1312                                             rx_desc, (struct iscsi_text *)hdr);
1313                 break;
1314         default:
1315                 pr_err("Got unknown iSCSI OpCode: 0x%02x\n", opcode);
1316                 dump_stack();
1317                 break;
1318         }
1319
1320         return ret;
1321 }
1322
1323 static void
1324 isert_rx_do_work(struct iser_rx_desc *rx_desc, struct isert_conn *isert_conn)
1325 {
1326         struct iser_hdr *iser_hdr = &rx_desc->iser_header;
1327         uint64_t read_va = 0, write_va = 0;
1328         uint32_t read_stag = 0, write_stag = 0;
1329         int rc;
1330
1331         switch (iser_hdr->flags & 0xF0) {
1332         case ISCSI_CTRL:
1333                 if (iser_hdr->flags & ISER_RSV) {
1334                         read_stag = be32_to_cpu(iser_hdr->read_stag);
1335                         read_va = be64_to_cpu(iser_hdr->read_va);
1336                         pr_debug("ISER_RSV: read_stag: 0x%08x read_va: 0x%16llx\n",
1337                                  read_stag, (unsigned long long)read_va);
1338                 }
1339                 if (iser_hdr->flags & ISER_WSV) {
1340                         write_stag = be32_to_cpu(iser_hdr->write_stag);
1341                         write_va = be64_to_cpu(iser_hdr->write_va);
1342                         pr_debug("ISER_WSV: write__stag: 0x%08x write_va: 0x%16llx\n",
1343                                  write_stag, (unsigned long long)write_va);
1344                 }
1345
1346                 pr_debug("ISER ISCSI_CTRL PDU\n");
1347                 break;
1348         case ISER_HELLO:
1349                 pr_err("iSER Hello message\n");
1350                 break;
1351         default:
1352                 pr_warn("Unknown iSER hdr flags: 0x%02x\n", iser_hdr->flags);
1353                 break;
1354         }
1355
1356         rc = isert_rx_opcode(isert_conn, rx_desc,
1357                              read_stag, read_va, write_stag, write_va);
1358 }
1359
1360 static void
1361 isert_rx_completion(struct iser_rx_desc *desc, struct isert_conn *isert_conn,
1362                     unsigned long xfer_len)
1363 {
1364         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
1365         struct iscsi_hdr *hdr;
1366         u64 rx_dma;
1367         int rx_buflen, outstanding;
1368
1369         if ((char *)desc == isert_conn->login_req_buf) {
1370                 rx_dma = isert_conn->login_req_dma;
1371                 rx_buflen = ISER_RX_LOGIN_SIZE;
1372                 pr_debug("ISER login_buf: Using rx_dma: 0x%llx, rx_buflen: %d\n",
1373                          rx_dma, rx_buflen);
1374         } else {
1375                 rx_dma = desc->dma_addr;
1376                 rx_buflen = ISER_RX_PAYLOAD_SIZE;
1377                 pr_debug("ISER req_buf: Using rx_dma: 0x%llx, rx_buflen: %d\n",
1378                          rx_dma, rx_buflen);
1379         }
1380
1381         ib_dma_sync_single_for_cpu(ib_dev, rx_dma, rx_buflen, DMA_FROM_DEVICE);
1382
1383         hdr = &desc->iscsi_header;
1384         pr_debug("iSCSI opcode: 0x%02x, ITT: 0x%08x, flags: 0x%02x dlen: %d\n",
1385                  hdr->opcode, hdr->itt, hdr->flags,
1386                  (int)(xfer_len - ISER_HEADERS_LEN));
1387
1388         if ((char *)desc == isert_conn->login_req_buf)
1389                 isert_rx_login_req(desc, xfer_len - ISER_HEADERS_LEN,
1390                                    isert_conn);
1391         else
1392                 isert_rx_do_work(desc, isert_conn);
1393
1394         ib_dma_sync_single_for_device(ib_dev, rx_dma, rx_buflen,
1395                                       DMA_FROM_DEVICE);
1396
1397         isert_conn->post_recv_buf_count--;
1398         pr_debug("iSERT: Decremented post_recv_buf_count: %d\n",
1399                  isert_conn->post_recv_buf_count);
1400
1401         if ((char *)desc == isert_conn->login_req_buf)
1402                 return;
1403
1404         outstanding = isert_conn->post_recv_buf_count;
1405         if (outstanding + ISERT_MIN_POSTED_RX <= ISERT_QP_MAX_RECV_DTOS) {
1406                 int err, count = min(ISERT_QP_MAX_RECV_DTOS - outstanding,
1407                                 ISERT_MIN_POSTED_RX);
1408                 err = isert_post_recv(isert_conn, count);
1409                 if (err) {
1410                         pr_err("isert_post_recv() count: %d failed, %d\n",
1411                                count, err);
1412                 }
1413         }
1414 }
1415
1416 static void
1417 isert_unmap_cmd(struct isert_cmd *isert_cmd, struct isert_conn *isert_conn)
1418 {
1419         struct isert_rdma_wr *wr = &isert_cmd->rdma_wr;
1420         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
1421
1422         pr_debug("isert_unmap_cmd: %p\n", isert_cmd);
1423         if (wr->sge) {
1424                 pr_debug("isert_unmap_cmd: %p unmap_sg op\n", isert_cmd);
1425                 ib_dma_unmap_sg(ib_dev, wr->sge, wr->num_sge,
1426                                 (wr->iser_ib_op == ISER_IB_RDMA_WRITE) ?
1427                                 DMA_TO_DEVICE : DMA_FROM_DEVICE);
1428                 wr->sge = NULL;
1429         }
1430
1431         if (wr->send_wr) {
1432                 pr_debug("isert_unmap_cmd: %p free send_wr\n", isert_cmd);
1433                 kfree(wr->send_wr);
1434                 wr->send_wr = NULL;
1435         }
1436
1437         if (wr->ib_sge) {
1438                 pr_debug("isert_unmap_cmd: %p free ib_sge\n", isert_cmd);
1439                 kfree(wr->ib_sge);
1440                 wr->ib_sge = NULL;
1441         }
1442 }
1443
1444 static void
1445 isert_unreg_rdma(struct isert_cmd *isert_cmd, struct isert_conn *isert_conn)
1446 {
1447         struct isert_rdma_wr *wr = &isert_cmd->rdma_wr;
1448         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
1449         LIST_HEAD(unmap_list);
1450
1451         pr_debug("unreg_fastreg_cmd: %p\n", isert_cmd);
1452
1453         if (wr->fr_desc) {
1454                 pr_debug("unreg_fastreg_cmd: %p free fr_desc %p\n",
1455                          isert_cmd, wr->fr_desc);
1456                 spin_lock_bh(&isert_conn->conn_lock);
1457                 list_add_tail(&wr->fr_desc->list, &isert_conn->conn_fr_pool);
1458                 spin_unlock_bh(&isert_conn->conn_lock);
1459                 wr->fr_desc = NULL;
1460         }
1461
1462         if (wr->sge) {
1463                 pr_debug("unreg_fastreg_cmd: %p unmap_sg op\n", isert_cmd);
1464                 ib_dma_unmap_sg(ib_dev, wr->sge, wr->num_sge,
1465                                 (wr->iser_ib_op == ISER_IB_RDMA_WRITE) ?
1466                                 DMA_TO_DEVICE : DMA_FROM_DEVICE);
1467                 wr->sge = NULL;
1468         }
1469
1470         wr->ib_sge = NULL;
1471         wr->send_wr = NULL;
1472 }
1473
1474 static void
1475 isert_put_cmd(struct isert_cmd *isert_cmd, bool comp_err)
1476 {
1477         struct iscsi_cmd *cmd = isert_cmd->iscsi_cmd;
1478         struct isert_conn *isert_conn = isert_cmd->conn;
1479         struct iscsi_conn *conn = isert_conn->conn;
1480         struct isert_device *device = isert_conn->conn_device;
1481
1482         pr_debug("Entering isert_put_cmd: %p\n", isert_cmd);
1483
1484         switch (cmd->iscsi_opcode) {
1485         case ISCSI_OP_SCSI_CMD:
1486                 spin_lock_bh(&conn->cmd_lock);
1487                 if (!list_empty(&cmd->i_conn_node))
1488                         list_del_init(&cmd->i_conn_node);
1489                 spin_unlock_bh(&conn->cmd_lock);
1490
1491                 if (cmd->data_direction == DMA_TO_DEVICE) {
1492                         iscsit_stop_dataout_timer(cmd);
1493                         /*
1494                          * Check for special case during comp_err where
1495                          * WRITE_PENDING has been handed off from core,
1496                          * but requires an extra target_put_sess_cmd()
1497                          * before transport_generic_free_cmd() below.
1498                          */
1499                         if (comp_err &&
1500                             cmd->se_cmd.t_state == TRANSPORT_WRITE_PENDING) {
1501                                 struct se_cmd *se_cmd = &cmd->se_cmd;
1502
1503                                 target_put_sess_cmd(se_cmd->se_sess, se_cmd);
1504                         }
1505                 }
1506
1507                 device->unreg_rdma_mem(isert_cmd, isert_conn);
1508                 transport_generic_free_cmd(&cmd->se_cmd, 0);
1509                 break;
1510         case ISCSI_OP_SCSI_TMFUNC:
1511                 spin_lock_bh(&conn->cmd_lock);
1512                 if (!list_empty(&cmd->i_conn_node))
1513                         list_del_init(&cmd->i_conn_node);
1514                 spin_unlock_bh(&conn->cmd_lock);
1515
1516                 transport_generic_free_cmd(&cmd->se_cmd, 0);
1517                 break;
1518         case ISCSI_OP_REJECT:
1519         case ISCSI_OP_NOOP_OUT:
1520         case ISCSI_OP_TEXT:
1521                 spin_lock_bh(&conn->cmd_lock);
1522                 if (!list_empty(&cmd->i_conn_node))
1523                         list_del_init(&cmd->i_conn_node);
1524                 spin_unlock_bh(&conn->cmd_lock);
1525
1526                 /*
1527                  * Handle special case for REJECT when iscsi_add_reject*() has
1528                  * overwritten the original iscsi_opcode assignment, and the
1529                  * associated cmd->se_cmd needs to be released.
1530                  */
1531                 if (cmd->se_cmd.se_tfo != NULL) {
1532                         pr_debug("Calling transport_generic_free_cmd from"
1533                                  " isert_put_cmd for 0x%02x\n",
1534                                  cmd->iscsi_opcode);
1535                         transport_generic_free_cmd(&cmd->se_cmd, 0);
1536                         break;
1537                 }
1538                 /*
1539                  * Fall-through
1540                  */
1541         default:
1542                 iscsit_release_cmd(cmd);
1543                 break;
1544         }
1545 }
1546
1547 static void
1548 isert_unmap_tx_desc(struct iser_tx_desc *tx_desc, struct ib_device *ib_dev)
1549 {
1550         if (tx_desc->dma_addr != 0) {
1551                 pr_debug("Calling ib_dma_unmap_single for tx_desc->dma_addr\n");
1552                 ib_dma_unmap_single(ib_dev, tx_desc->dma_addr,
1553                                     ISER_HEADERS_LEN, DMA_TO_DEVICE);
1554                 tx_desc->dma_addr = 0;
1555         }
1556 }
1557
1558 static void
1559 isert_completion_put(struct iser_tx_desc *tx_desc, struct isert_cmd *isert_cmd,
1560                      struct ib_device *ib_dev, bool comp_err)
1561 {
1562         if (isert_cmd->pdu_buf_dma != 0) {
1563                 pr_debug("Calling ib_dma_unmap_single for isert_cmd->pdu_buf_dma\n");
1564                 ib_dma_unmap_single(ib_dev, isert_cmd->pdu_buf_dma,
1565                                     isert_cmd->pdu_buf_len, DMA_TO_DEVICE);
1566                 isert_cmd->pdu_buf_dma = 0;
1567         }
1568
1569         isert_unmap_tx_desc(tx_desc, ib_dev);
1570         isert_put_cmd(isert_cmd, comp_err);
1571 }
1572
1573 static void
1574 isert_completion_rdma_read(struct iser_tx_desc *tx_desc,
1575                            struct isert_cmd *isert_cmd)
1576 {
1577         struct isert_rdma_wr *wr = &isert_cmd->rdma_wr;
1578         struct iscsi_cmd *cmd = isert_cmd->iscsi_cmd;
1579         struct se_cmd *se_cmd = &cmd->se_cmd;
1580         struct isert_conn *isert_conn = isert_cmd->conn;
1581         struct isert_device *device = isert_conn->conn_device;
1582
1583         iscsit_stop_dataout_timer(cmd);
1584         device->unreg_rdma_mem(isert_cmd, isert_conn);
1585         cmd->write_data_done = wr->cur_rdma_length;
1586         wr->send_wr_num = 0;
1587
1588         pr_debug("Cmd: %p RDMA_READ comp calling execute_cmd\n", isert_cmd);
1589         spin_lock_bh(&cmd->istate_lock);
1590         cmd->cmd_flags |= ICF_GOT_LAST_DATAOUT;
1591         cmd->i_state = ISTATE_RECEIVED_LAST_DATAOUT;
1592         spin_unlock_bh(&cmd->istate_lock);
1593
1594         target_execute_cmd(se_cmd);
1595 }
1596
1597 static void
1598 isert_do_control_comp(struct work_struct *work)
1599 {
1600         struct isert_cmd *isert_cmd = container_of(work,
1601                         struct isert_cmd, comp_work);
1602         struct isert_conn *isert_conn = isert_cmd->conn;
1603         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
1604         struct iscsi_cmd *cmd = isert_cmd->iscsi_cmd;
1605
1606         switch (cmd->i_state) {
1607         case ISTATE_SEND_TASKMGTRSP:
1608                 pr_debug("Calling iscsit_tmr_post_handler >>>>>>>>>>>>>>>>>\n");
1609
1610                 atomic_dec(&isert_conn->post_send_buf_count);
1611                 iscsit_tmr_post_handler(cmd, cmd->conn);
1612
1613                 cmd->i_state = ISTATE_SENT_STATUS;
1614                 isert_completion_put(&isert_cmd->tx_desc, isert_cmd, ib_dev, false);
1615                 break;
1616         case ISTATE_SEND_REJECT:
1617                 pr_debug("Got isert_do_control_comp ISTATE_SEND_REJECT: >>>\n");
1618                 atomic_dec(&isert_conn->post_send_buf_count);
1619
1620                 cmd->i_state = ISTATE_SENT_STATUS;
1621                 isert_completion_put(&isert_cmd->tx_desc, isert_cmd, ib_dev, false);
1622                 break;
1623         case ISTATE_SEND_LOGOUTRSP:
1624                 pr_debug("Calling iscsit_logout_post_handler >>>>>>>>>>>>>>\n");
1625
1626                 atomic_dec(&isert_conn->post_send_buf_count);
1627                 iscsit_logout_post_handler(cmd, cmd->conn);
1628                 break;
1629         case ISTATE_SEND_TEXTRSP:
1630                 atomic_dec(&isert_conn->post_send_buf_count);
1631                 cmd->i_state = ISTATE_SENT_STATUS;
1632                 isert_completion_put(&isert_cmd->tx_desc, isert_cmd, ib_dev, false);
1633                 break;
1634         default:
1635                 pr_err("Unknown do_control_comp i_state %d\n", cmd->i_state);
1636                 dump_stack();
1637                 break;
1638         }
1639 }
1640
1641 static void
1642 isert_response_completion(struct iser_tx_desc *tx_desc,
1643                           struct isert_cmd *isert_cmd,
1644                           struct isert_conn *isert_conn,
1645                           struct ib_device *ib_dev)
1646 {
1647         struct iscsi_cmd *cmd = isert_cmd->iscsi_cmd;
1648         struct isert_rdma_wr *wr = &isert_cmd->rdma_wr;
1649
1650         if (cmd->i_state == ISTATE_SEND_TASKMGTRSP ||
1651             cmd->i_state == ISTATE_SEND_LOGOUTRSP ||
1652             cmd->i_state == ISTATE_SEND_REJECT ||
1653             cmd->i_state == ISTATE_SEND_TEXTRSP) {
1654                 isert_unmap_tx_desc(tx_desc, ib_dev);
1655
1656                 INIT_WORK(&isert_cmd->comp_work, isert_do_control_comp);
1657                 queue_work(isert_comp_wq, &isert_cmd->comp_work);
1658                 return;
1659         }
1660         atomic_sub(wr->send_wr_num + 1, &isert_conn->post_send_buf_count);
1661
1662         cmd->i_state = ISTATE_SENT_STATUS;
1663         isert_completion_put(tx_desc, isert_cmd, ib_dev, false);
1664 }
1665
1666 static void
1667 __isert_send_completion(struct iser_tx_desc *tx_desc,
1668                         struct isert_conn *isert_conn)
1669 {
1670         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
1671         struct isert_cmd *isert_cmd = tx_desc->isert_cmd;
1672         struct isert_rdma_wr *wr;
1673
1674         if (!isert_cmd) {
1675                 atomic_dec(&isert_conn->post_send_buf_count);
1676                 isert_unmap_tx_desc(tx_desc, ib_dev);
1677                 return;
1678         }
1679         wr = &isert_cmd->rdma_wr;
1680
1681         switch (wr->iser_ib_op) {
1682         case ISER_IB_RECV:
1683                 pr_err("isert_send_completion: Got ISER_IB_RECV\n");
1684                 dump_stack();
1685                 break;
1686         case ISER_IB_SEND:
1687                 pr_debug("isert_send_completion: Got ISER_IB_SEND\n");
1688                 isert_response_completion(tx_desc, isert_cmd,
1689                                           isert_conn, ib_dev);
1690                 break;
1691         case ISER_IB_RDMA_WRITE:
1692                 pr_err("isert_send_completion: Got ISER_IB_RDMA_WRITE\n");
1693                 dump_stack();
1694                 break;
1695         case ISER_IB_RDMA_READ:
1696                 pr_debug("isert_send_completion: Got ISER_IB_RDMA_READ:\n");
1697
1698                 atomic_sub(wr->send_wr_num, &isert_conn->post_send_buf_count);
1699                 isert_completion_rdma_read(tx_desc, isert_cmd);
1700                 break;
1701         default:
1702                 pr_err("Unknown wr->iser_ib_op: 0x%02x\n", wr->iser_ib_op);
1703                 dump_stack();
1704                 break;
1705         }
1706 }
1707
1708 static void
1709 isert_send_completion(struct iser_tx_desc *tx_desc,
1710                       struct isert_conn *isert_conn)
1711 {
1712         struct llist_node *llnode = tx_desc->comp_llnode_batch;
1713         struct iser_tx_desc *t;
1714         /*
1715          * Drain coalesced completion llist starting from comp_llnode_batch
1716          * setup in isert_init_send_wr(), and then complete trailing tx_desc.
1717          */
1718         while (llnode) {
1719                 t = llist_entry(llnode, struct iser_tx_desc, comp_llnode);
1720                 llnode = llist_next(llnode);
1721                 __isert_send_completion(t, isert_conn);
1722         }
1723         __isert_send_completion(tx_desc, isert_conn);
1724 }
1725
1726 static void
1727 isert_cq_drain_comp_llist(struct isert_conn *isert_conn, struct ib_device *ib_dev)
1728 {
1729         struct llist_node *llnode;
1730         struct isert_rdma_wr *wr;
1731         struct iser_tx_desc *t;
1732
1733         mutex_lock(&isert_conn->conn_mutex);
1734         llnode = llist_del_all(&isert_conn->conn_comp_llist);
1735         isert_conn->conn_comp_batch = 0;
1736         mutex_unlock(&isert_conn->conn_mutex);
1737
1738         while (llnode) {
1739                 t = llist_entry(llnode, struct iser_tx_desc, comp_llnode);
1740                 llnode = llist_next(llnode);
1741                 wr = &t->isert_cmd->rdma_wr;
1742
1743                 atomic_sub(wr->send_wr_num + 1, &isert_conn->post_send_buf_count);
1744                 isert_completion_put(t, t->isert_cmd, ib_dev, true);
1745         }
1746 }
1747
1748 static void
1749 isert_cq_tx_comp_err(struct iser_tx_desc *tx_desc, struct isert_conn *isert_conn)
1750 {
1751         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
1752         struct isert_cmd *isert_cmd = tx_desc->isert_cmd;
1753         struct llist_node *llnode = tx_desc->comp_llnode_batch;
1754         struct isert_rdma_wr *wr;
1755         struct iser_tx_desc *t;
1756
1757         while (llnode) {
1758                 t = llist_entry(llnode, struct iser_tx_desc, comp_llnode);
1759                 llnode = llist_next(llnode);
1760                 wr = &t->isert_cmd->rdma_wr;
1761
1762                 atomic_sub(wr->send_wr_num + 1, &isert_conn->post_send_buf_count);
1763                 isert_completion_put(t, t->isert_cmd, ib_dev, true);
1764         }
1765         tx_desc->comp_llnode_batch = NULL;
1766
1767         if (!isert_cmd)
1768                 isert_unmap_tx_desc(tx_desc, ib_dev);
1769         else
1770                 isert_completion_put(tx_desc, isert_cmd, ib_dev, true);
1771 }
1772
1773 static void
1774 isert_cq_rx_comp_err(struct isert_conn *isert_conn)
1775 {
1776         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
1777         struct iscsi_conn *conn = isert_conn->conn;
1778
1779         if (isert_conn->post_recv_buf_count)
1780                 return;
1781
1782         isert_cq_drain_comp_llist(isert_conn, ib_dev);
1783
1784         if (conn->sess) {
1785                 target_sess_cmd_list_set_waiting(conn->sess->se_sess);
1786                 target_wait_for_sess_cmds(conn->sess->se_sess);
1787         }
1788
1789         while (atomic_read(&isert_conn->post_send_buf_count))
1790                 msleep(3000);
1791
1792         mutex_lock(&isert_conn->conn_mutex);
1793         isert_conn->state = ISER_CONN_DOWN;
1794         mutex_unlock(&isert_conn->conn_mutex);
1795
1796         iscsit_cause_connection_reinstatement(isert_conn->conn, 0);
1797
1798         complete(&isert_conn->conn_wait_comp_err);
1799 }
1800
1801 static void
1802 isert_cq_tx_work(struct work_struct *work)
1803 {
1804         struct isert_cq_desc *cq_desc = container_of(work,
1805                                 struct isert_cq_desc, cq_tx_work);
1806         struct isert_device *device = cq_desc->device;
1807         int cq_index = cq_desc->cq_index;
1808         struct ib_cq *tx_cq = device->dev_tx_cq[cq_index];
1809         struct isert_conn *isert_conn;
1810         struct iser_tx_desc *tx_desc;
1811         struct ib_wc wc;
1812
1813         while (ib_poll_cq(tx_cq, 1, &wc) == 1) {
1814                 tx_desc = (struct iser_tx_desc *)(unsigned long)wc.wr_id;
1815                 isert_conn = wc.qp->qp_context;
1816
1817                 if (wc.status == IB_WC_SUCCESS) {
1818                         isert_send_completion(tx_desc, isert_conn);
1819                 } else {
1820                         pr_debug("TX wc.status != IB_WC_SUCCESS >>>>>>>>>>>>>>\n");
1821                         pr_debug("TX wc.status: 0x%08x\n", wc.status);
1822                         pr_debug("TX wc.vendor_err: 0x%08x\n", wc.vendor_err);
1823
1824                         if (wc.wr_id != ISER_FASTREG_LI_WRID) {
1825                                 if (tx_desc->llnode_active)
1826                                         continue;
1827
1828                                 atomic_dec(&isert_conn->post_send_buf_count);
1829                                 isert_cq_tx_comp_err(tx_desc, isert_conn);
1830                         }
1831                 }
1832         }
1833
1834         ib_req_notify_cq(tx_cq, IB_CQ_NEXT_COMP);
1835 }
1836
1837 static void
1838 isert_cq_tx_callback(struct ib_cq *cq, void *context)
1839 {
1840         struct isert_cq_desc *cq_desc = (struct isert_cq_desc *)context;
1841
1842         queue_work(isert_comp_wq, &cq_desc->cq_tx_work);
1843 }
1844
1845 static void
1846 isert_cq_rx_work(struct work_struct *work)
1847 {
1848         struct isert_cq_desc *cq_desc = container_of(work,
1849                         struct isert_cq_desc, cq_rx_work);
1850         struct isert_device *device = cq_desc->device;
1851         int cq_index = cq_desc->cq_index;
1852         struct ib_cq *rx_cq = device->dev_rx_cq[cq_index];
1853         struct isert_conn *isert_conn;
1854         struct iser_rx_desc *rx_desc;
1855         struct ib_wc wc;
1856         unsigned long xfer_len;
1857
1858         while (ib_poll_cq(rx_cq, 1, &wc) == 1) {
1859                 rx_desc = (struct iser_rx_desc *)(unsigned long)wc.wr_id;
1860                 isert_conn = wc.qp->qp_context;
1861
1862                 if (wc.status == IB_WC_SUCCESS) {
1863                         xfer_len = (unsigned long)wc.byte_len;
1864                         isert_rx_completion(rx_desc, isert_conn, xfer_len);
1865                 } else {
1866                         pr_debug("RX wc.status != IB_WC_SUCCESS >>>>>>>>>>>>>>\n");
1867                         if (wc.status != IB_WC_WR_FLUSH_ERR) {
1868                                 pr_debug("RX wc.status: 0x%08x\n", wc.status);
1869                                 pr_debug("RX wc.vendor_err: 0x%08x\n",
1870                                          wc.vendor_err);
1871                         }
1872                         isert_conn->post_recv_buf_count--;
1873                         isert_cq_rx_comp_err(isert_conn);
1874                 }
1875         }
1876
1877         ib_req_notify_cq(rx_cq, IB_CQ_NEXT_COMP);
1878 }
1879
1880 static void
1881 isert_cq_rx_callback(struct ib_cq *cq, void *context)
1882 {
1883         struct isert_cq_desc *cq_desc = (struct isert_cq_desc *)context;
1884
1885         queue_work(isert_rx_wq, &cq_desc->cq_rx_work);
1886 }
1887
1888 static int
1889 isert_post_response(struct isert_conn *isert_conn, struct isert_cmd *isert_cmd)
1890 {
1891         struct ib_send_wr *wr_failed;
1892         int ret;
1893
1894         atomic_inc(&isert_conn->post_send_buf_count);
1895
1896         ret = ib_post_send(isert_conn->conn_qp, &isert_cmd->tx_desc.send_wr,
1897                            &wr_failed);
1898         if (ret) {
1899                 pr_err("ib_post_send failed with %d\n", ret);
1900                 atomic_dec(&isert_conn->post_send_buf_count);
1901                 return ret;
1902         }
1903         return ret;
1904 }
1905
1906 static int
1907 isert_put_response(struct iscsi_conn *conn, struct iscsi_cmd *cmd)
1908 {
1909         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
1910         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
1911         struct ib_send_wr *send_wr = &isert_cmd->tx_desc.send_wr;
1912         struct iscsi_scsi_rsp *hdr = (struct iscsi_scsi_rsp *)
1913                                 &isert_cmd->tx_desc.iscsi_header;
1914
1915         isert_create_send_desc(isert_conn, isert_cmd, &isert_cmd->tx_desc);
1916         iscsit_build_rsp_pdu(cmd, conn, true, hdr);
1917         isert_init_tx_hdrs(isert_conn, &isert_cmd->tx_desc);
1918         /*
1919          * Attach SENSE DATA payload to iSCSI Response PDU
1920          */
1921         if (cmd->se_cmd.sense_buffer &&
1922             ((cmd->se_cmd.se_cmd_flags & SCF_TRANSPORT_TASK_SENSE) ||
1923             (cmd->se_cmd.se_cmd_flags & SCF_EMULATED_TASK_SENSE))) {
1924                 struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
1925                 struct ib_sge *tx_dsg = &isert_cmd->tx_desc.tx_sg[1];
1926                 u32 padding, pdu_len;
1927
1928                 put_unaligned_be16(cmd->se_cmd.scsi_sense_length,
1929                                    cmd->sense_buffer);
1930                 cmd->se_cmd.scsi_sense_length += sizeof(__be16);
1931
1932                 padding = -(cmd->se_cmd.scsi_sense_length) & 3;
1933                 hton24(hdr->dlength, (u32)cmd->se_cmd.scsi_sense_length);
1934                 pdu_len = cmd->se_cmd.scsi_sense_length + padding;
1935
1936                 isert_cmd->pdu_buf_dma = ib_dma_map_single(ib_dev,
1937                                 (void *)cmd->sense_buffer, pdu_len,
1938                                 DMA_TO_DEVICE);
1939
1940                 isert_cmd->pdu_buf_len = pdu_len;
1941                 tx_dsg->addr    = isert_cmd->pdu_buf_dma;
1942                 tx_dsg->length  = pdu_len;
1943                 tx_dsg->lkey    = isert_conn->conn_mr->lkey;
1944                 isert_cmd->tx_desc.num_sge = 2;
1945         }
1946
1947         isert_init_send_wr(isert_conn, isert_cmd, send_wr, true);
1948
1949         pr_debug("Posting SCSI Response IB_WR_SEND >>>>>>>>>>>>>>>>>>>>>>\n");
1950
1951         return isert_post_response(isert_conn, isert_cmd);
1952 }
1953
1954 static int
1955 isert_put_nopin(struct iscsi_cmd *cmd, struct iscsi_conn *conn,
1956                 bool nopout_response)
1957 {
1958         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
1959         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
1960         struct ib_send_wr *send_wr = &isert_cmd->tx_desc.send_wr;
1961
1962         isert_create_send_desc(isert_conn, isert_cmd, &isert_cmd->tx_desc);
1963         iscsit_build_nopin_rsp(cmd, conn, (struct iscsi_nopin *)
1964                                &isert_cmd->tx_desc.iscsi_header,
1965                                nopout_response);
1966         isert_init_tx_hdrs(isert_conn, &isert_cmd->tx_desc);
1967         isert_init_send_wr(isert_conn, isert_cmd, send_wr, false);
1968
1969         pr_debug("Posting NOPIN Response IB_WR_SEND >>>>>>>>>>>>>>>>>>>>>>\n");
1970
1971         return isert_post_response(isert_conn, isert_cmd);
1972 }
1973
1974 static int
1975 isert_put_logout_rsp(struct iscsi_cmd *cmd, struct iscsi_conn *conn)
1976 {
1977         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
1978         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
1979         struct ib_send_wr *send_wr = &isert_cmd->tx_desc.send_wr;
1980
1981         isert_create_send_desc(isert_conn, isert_cmd, &isert_cmd->tx_desc);
1982         iscsit_build_logout_rsp(cmd, conn, (struct iscsi_logout_rsp *)
1983                                 &isert_cmd->tx_desc.iscsi_header);
1984         isert_init_tx_hdrs(isert_conn, &isert_cmd->tx_desc);
1985         isert_init_send_wr(isert_conn, isert_cmd, send_wr, false);
1986
1987         pr_debug("Posting Logout Response IB_WR_SEND >>>>>>>>>>>>>>>>>>>>>>\n");
1988
1989         return isert_post_response(isert_conn, isert_cmd);
1990 }
1991
1992 static int
1993 isert_put_tm_rsp(struct iscsi_cmd *cmd, struct iscsi_conn *conn)
1994 {
1995         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
1996         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
1997         struct ib_send_wr *send_wr = &isert_cmd->tx_desc.send_wr;
1998
1999         isert_create_send_desc(isert_conn, isert_cmd, &isert_cmd->tx_desc);
2000         iscsit_build_task_mgt_rsp(cmd, conn, (struct iscsi_tm_rsp *)
2001                                   &isert_cmd->tx_desc.iscsi_header);
2002         isert_init_tx_hdrs(isert_conn, &isert_cmd->tx_desc);
2003         isert_init_send_wr(isert_conn, isert_cmd, send_wr, false);
2004
2005         pr_debug("Posting Task Management Response IB_WR_SEND >>>>>>>>>>>>>>>>>>>>>>\n");
2006
2007         return isert_post_response(isert_conn, isert_cmd);
2008 }
2009
2010 static int
2011 isert_put_reject(struct iscsi_cmd *cmd, struct iscsi_conn *conn)
2012 {
2013         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
2014         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
2015         struct ib_send_wr *send_wr = &isert_cmd->tx_desc.send_wr;
2016         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
2017         struct ib_sge *tx_dsg = &isert_cmd->tx_desc.tx_sg[1];
2018         struct iscsi_reject *hdr =
2019                 (struct iscsi_reject *)&isert_cmd->tx_desc.iscsi_header;
2020
2021         isert_create_send_desc(isert_conn, isert_cmd, &isert_cmd->tx_desc);
2022         iscsit_build_reject(cmd, conn, hdr);
2023         isert_init_tx_hdrs(isert_conn, &isert_cmd->tx_desc);
2024
2025         hton24(hdr->dlength, ISCSI_HDR_LEN);
2026         isert_cmd->pdu_buf_dma = ib_dma_map_single(ib_dev,
2027                         (void *)cmd->buf_ptr, ISCSI_HDR_LEN,
2028                         DMA_TO_DEVICE);
2029         isert_cmd->pdu_buf_len = ISCSI_HDR_LEN;
2030         tx_dsg->addr    = isert_cmd->pdu_buf_dma;
2031         tx_dsg->length  = ISCSI_HDR_LEN;
2032         tx_dsg->lkey    = isert_conn->conn_mr->lkey;
2033         isert_cmd->tx_desc.num_sge = 2;
2034
2035         isert_init_send_wr(isert_conn, isert_cmd, send_wr, false);
2036
2037         pr_debug("Posting Reject IB_WR_SEND >>>>>>>>>>>>>>>>>>>>>>\n");
2038
2039         return isert_post_response(isert_conn, isert_cmd);
2040 }
2041
2042 static int
2043 isert_put_text_rsp(struct iscsi_cmd *cmd, struct iscsi_conn *conn)
2044 {
2045         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
2046         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
2047         struct ib_send_wr *send_wr = &isert_cmd->tx_desc.send_wr;
2048         struct iscsi_text_rsp *hdr =
2049                 (struct iscsi_text_rsp *)&isert_cmd->tx_desc.iscsi_header;
2050         u32 txt_rsp_len;
2051         int rc;
2052
2053         isert_create_send_desc(isert_conn, isert_cmd, &isert_cmd->tx_desc);
2054         rc = iscsit_build_text_rsp(cmd, conn, hdr, ISCSI_INFINIBAND);
2055         if (rc < 0)
2056                 return rc;
2057
2058         txt_rsp_len = rc;
2059         isert_init_tx_hdrs(isert_conn, &isert_cmd->tx_desc);
2060
2061         if (txt_rsp_len) {
2062                 struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
2063                 struct ib_sge *tx_dsg = &isert_cmd->tx_desc.tx_sg[1];
2064                 void *txt_rsp_buf = cmd->buf_ptr;
2065
2066                 isert_cmd->pdu_buf_dma = ib_dma_map_single(ib_dev,
2067                                 txt_rsp_buf, txt_rsp_len, DMA_TO_DEVICE);
2068
2069                 isert_cmd->pdu_buf_len = txt_rsp_len;
2070                 tx_dsg->addr    = isert_cmd->pdu_buf_dma;
2071                 tx_dsg->length  = txt_rsp_len;
2072                 tx_dsg->lkey    = isert_conn->conn_mr->lkey;
2073                 isert_cmd->tx_desc.num_sge = 2;
2074         }
2075         isert_init_send_wr(isert_conn, isert_cmd, send_wr, false);
2076
2077         pr_debug("Posting Text Response IB_WR_SEND >>>>>>>>>>>>>>>>>>>>>>\n");
2078
2079         return isert_post_response(isert_conn, isert_cmd);
2080 }
2081
2082 static int
2083 isert_build_rdma_wr(struct isert_conn *isert_conn, struct isert_cmd *isert_cmd,
2084                     struct ib_sge *ib_sge, struct ib_send_wr *send_wr,
2085                     u32 data_left, u32 offset)
2086 {
2087         struct iscsi_cmd *cmd = isert_cmd->iscsi_cmd;
2088         struct scatterlist *sg_start, *tmp_sg;
2089         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
2090         u32 sg_off, page_off;
2091         int i = 0, sg_nents;
2092
2093         sg_off = offset / PAGE_SIZE;
2094         sg_start = &cmd->se_cmd.t_data_sg[sg_off];
2095         sg_nents = min(cmd->se_cmd.t_data_nents - sg_off, isert_conn->max_sge);
2096         page_off = offset % PAGE_SIZE;
2097
2098         send_wr->sg_list = ib_sge;
2099         send_wr->num_sge = sg_nents;
2100         send_wr->wr_id = (unsigned long)&isert_cmd->tx_desc;
2101         /*
2102          * Perform mapping of TCM scatterlist memory ib_sge dma_addr.
2103          */
2104         for_each_sg(sg_start, tmp_sg, sg_nents, i) {
2105                 pr_debug("ISER RDMA from SGL dma_addr: 0x%16llx dma_len: %u, page_off: %u\n",
2106                          (unsigned long long)tmp_sg->dma_address,
2107                          tmp_sg->length, page_off);
2108
2109                 ib_sge->addr = ib_sg_dma_address(ib_dev, tmp_sg) + page_off;
2110                 ib_sge->length = min_t(u32, data_left,
2111                                 ib_sg_dma_len(ib_dev, tmp_sg) - page_off);
2112                 ib_sge->lkey = isert_conn->conn_mr->lkey;
2113
2114                 pr_debug("RDMA ib_sge: addr: 0x%16llx  length: %u lkey: %08x\n",
2115                          ib_sge->addr, ib_sge->length, ib_sge->lkey);
2116                 page_off = 0;
2117                 data_left -= ib_sge->length;
2118                 ib_sge++;
2119                 pr_debug("Incrementing ib_sge pointer to %p\n", ib_sge);
2120         }
2121
2122         pr_debug("Set outgoing sg_list: %p num_sg: %u from TCM SGLs\n",
2123                  send_wr->sg_list, send_wr->num_sge);
2124
2125         return sg_nents;
2126 }
2127
2128 static int
2129 isert_map_rdma(struct iscsi_conn *conn, struct iscsi_cmd *cmd,
2130                struct isert_rdma_wr *wr)
2131 {
2132         struct se_cmd *se_cmd = &cmd->se_cmd;
2133         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
2134         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
2135         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
2136         struct ib_send_wr *send_wr;
2137         struct ib_sge *ib_sge;
2138         struct scatterlist *sg_start;
2139         u32 sg_off = 0, sg_nents;
2140         u32 offset = 0, data_len, data_left, rdma_write_max, va_offset = 0;
2141         int ret = 0, count, i, ib_sge_cnt;
2142
2143         if (wr->iser_ib_op == ISER_IB_RDMA_WRITE) {
2144                 data_left = se_cmd->data_length;
2145         } else {
2146                 sg_off = cmd->write_data_done / PAGE_SIZE;
2147                 data_left = se_cmd->data_length - cmd->write_data_done;
2148                 offset = cmd->write_data_done;
2149                 isert_cmd->tx_desc.isert_cmd = isert_cmd;
2150         }
2151
2152         sg_start = &cmd->se_cmd.t_data_sg[sg_off];
2153         sg_nents = se_cmd->t_data_nents - sg_off;
2154
2155         count = ib_dma_map_sg(ib_dev, sg_start, sg_nents,
2156                               (wr->iser_ib_op == ISER_IB_RDMA_WRITE) ?
2157                               DMA_TO_DEVICE : DMA_FROM_DEVICE);
2158         if (unlikely(!count)) {
2159                 pr_err("Cmd: %p unrable to map SGs\n", isert_cmd);
2160                 return -EINVAL;
2161         }
2162         wr->sge = sg_start;
2163         wr->num_sge = sg_nents;
2164         wr->cur_rdma_length = data_left;
2165         pr_debug("Mapped cmd: %p count: %u sg: %p sg_nents: %u rdma_len %d\n",
2166                  isert_cmd, count, sg_start, sg_nents, data_left);
2167
2168         ib_sge = kzalloc(sizeof(struct ib_sge) * sg_nents, GFP_KERNEL);
2169         if (!ib_sge) {
2170                 pr_warn("Unable to allocate ib_sge\n");
2171                 ret = -ENOMEM;
2172                 goto unmap_sg;
2173         }
2174         wr->ib_sge = ib_sge;
2175
2176         wr->send_wr_num = DIV_ROUND_UP(sg_nents, isert_conn->max_sge);
2177         wr->send_wr = kzalloc(sizeof(struct ib_send_wr) * wr->send_wr_num,
2178                                 GFP_KERNEL);
2179         if (!wr->send_wr) {
2180                 pr_debug("Unable to allocate wr->send_wr\n");
2181                 ret = -ENOMEM;
2182                 goto unmap_sg;
2183         }
2184
2185         wr->isert_cmd = isert_cmd;
2186         rdma_write_max = isert_conn->max_sge * PAGE_SIZE;
2187
2188         for (i = 0; i < wr->send_wr_num; i++) {
2189                 send_wr = &isert_cmd->rdma_wr.send_wr[i];
2190                 data_len = min(data_left, rdma_write_max);
2191
2192                 send_wr->send_flags = 0;
2193                 if (wr->iser_ib_op == ISER_IB_RDMA_WRITE) {
2194                         send_wr->opcode = IB_WR_RDMA_WRITE;
2195                         send_wr->wr.rdma.remote_addr = isert_cmd->read_va + offset;
2196                         send_wr->wr.rdma.rkey = isert_cmd->read_stag;
2197                         if (i + 1 == wr->send_wr_num)
2198                                 send_wr->next = &isert_cmd->tx_desc.send_wr;
2199                         else
2200                                 send_wr->next = &wr->send_wr[i + 1];
2201                 } else {
2202                         send_wr->opcode = IB_WR_RDMA_READ;
2203                         send_wr->wr.rdma.remote_addr = isert_cmd->write_va + va_offset;
2204                         send_wr->wr.rdma.rkey = isert_cmd->write_stag;
2205                         if (i + 1 == wr->send_wr_num)
2206                                 send_wr->send_flags = IB_SEND_SIGNALED;
2207                         else
2208                                 send_wr->next = &wr->send_wr[i + 1];
2209                 }
2210
2211                 ib_sge_cnt = isert_build_rdma_wr(isert_conn, isert_cmd, ib_sge,
2212                                         send_wr, data_len, offset);
2213                 ib_sge += ib_sge_cnt;
2214
2215                 offset += data_len;
2216                 va_offset += data_len;
2217                 data_left -= data_len;
2218         }
2219
2220         return 0;
2221 unmap_sg:
2222         ib_dma_unmap_sg(ib_dev, sg_start, sg_nents,
2223                         (wr->iser_ib_op == ISER_IB_RDMA_WRITE) ?
2224                         DMA_TO_DEVICE : DMA_FROM_DEVICE);
2225         return ret;
2226 }
2227
2228 static int
2229 isert_map_fr_pagelist(struct ib_device *ib_dev,
2230                       struct scatterlist *sg_start, int sg_nents, u64 *fr_pl)
2231 {
2232         u64 start_addr, end_addr, page, chunk_start = 0;
2233         struct scatterlist *tmp_sg;
2234         int i = 0, new_chunk, last_ent, n_pages;
2235
2236         n_pages = 0;
2237         new_chunk = 1;
2238         last_ent = sg_nents - 1;
2239         for_each_sg(sg_start, tmp_sg, sg_nents, i) {
2240                 start_addr = ib_sg_dma_address(ib_dev, tmp_sg);
2241                 if (new_chunk)
2242                         chunk_start = start_addr;
2243                 end_addr = start_addr + ib_sg_dma_len(ib_dev, tmp_sg);
2244
2245                 pr_debug("SGL[%d] dma_addr: 0x%16llx len: %u\n",
2246                          i, (unsigned long long)tmp_sg->dma_address,
2247                          tmp_sg->length);
2248
2249                 if ((end_addr & ~PAGE_MASK) && i < last_ent) {
2250                         new_chunk = 0;
2251                         continue;
2252                 }
2253                 new_chunk = 1;
2254
2255                 page = chunk_start & PAGE_MASK;
2256                 do {
2257                         fr_pl[n_pages++] = page;
2258                         pr_debug("Mapped page_list[%d] page_addr: 0x%16llx\n",
2259                                  n_pages - 1, page);
2260                         page += PAGE_SIZE;
2261                 } while (page < end_addr);
2262         }
2263
2264         return n_pages;
2265 }
2266
2267 static int
2268 isert_fast_reg_mr(struct fast_reg_descriptor *fr_desc,
2269                   struct isert_conn *isert_conn, struct scatterlist *sg_start,
2270                   struct ib_sge *ib_sge, u32 sg_nents, u32 offset,
2271                   unsigned int data_len)
2272 {
2273         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
2274         struct ib_send_wr fr_wr, inv_wr;
2275         struct ib_send_wr *bad_wr, *wr = NULL;
2276         int ret, pagelist_len;
2277         u32 page_off;
2278         u8 key;
2279
2280         sg_nents = min_t(unsigned int, sg_nents, ISCSI_ISER_SG_TABLESIZE);
2281         page_off = offset % PAGE_SIZE;
2282
2283         pr_debug("Use fr_desc %p sg_nents %d offset %u\n",
2284                  fr_desc, sg_nents, offset);
2285
2286         pagelist_len = isert_map_fr_pagelist(ib_dev, sg_start, sg_nents,
2287                                              &fr_desc->data_frpl->page_list[0]);
2288
2289         if (!fr_desc->valid) {
2290                 memset(&inv_wr, 0, sizeof(inv_wr));
2291                 inv_wr.wr_id = ISER_FASTREG_LI_WRID;
2292                 inv_wr.opcode = IB_WR_LOCAL_INV;
2293                 inv_wr.ex.invalidate_rkey = fr_desc->data_mr->rkey;
2294                 wr = &inv_wr;
2295                 /* Bump the key */
2296                 key = (u8)(fr_desc->data_mr->rkey & 0x000000FF);
2297                 ib_update_fast_reg_key(fr_desc->data_mr, ++key);
2298         }
2299
2300         /* Prepare FASTREG WR */
2301         memset(&fr_wr, 0, sizeof(fr_wr));
2302         fr_wr.wr_id = ISER_FASTREG_LI_WRID;
2303         fr_wr.opcode = IB_WR_FAST_REG_MR;
2304         fr_wr.wr.fast_reg.iova_start =
2305                 fr_desc->data_frpl->page_list[0] + page_off;
2306         fr_wr.wr.fast_reg.page_list = fr_desc->data_frpl;
2307         fr_wr.wr.fast_reg.page_list_len = pagelist_len;
2308         fr_wr.wr.fast_reg.page_shift = PAGE_SHIFT;
2309         fr_wr.wr.fast_reg.length = data_len;
2310         fr_wr.wr.fast_reg.rkey = fr_desc->data_mr->rkey;
2311         fr_wr.wr.fast_reg.access_flags = IB_ACCESS_LOCAL_WRITE;
2312
2313         if (!wr)
2314                 wr = &fr_wr;
2315         else
2316                 wr->next = &fr_wr;
2317
2318         ret = ib_post_send(isert_conn->conn_qp, wr, &bad_wr);
2319         if (ret) {
2320                 pr_err("fast registration failed, ret:%d\n", ret);
2321                 return ret;
2322         }
2323         fr_desc->valid = false;
2324
2325         ib_sge->lkey = fr_desc->data_mr->lkey;
2326         ib_sge->addr = fr_desc->data_frpl->page_list[0] + page_off;
2327         ib_sge->length = data_len;
2328
2329         pr_debug("RDMA ib_sge: addr: 0x%16llx  length: %u lkey: %08x\n",
2330                  ib_sge->addr, ib_sge->length, ib_sge->lkey);
2331
2332         return ret;
2333 }
2334
2335 static int
2336 isert_reg_rdma(struct iscsi_conn *conn, struct iscsi_cmd *cmd,
2337                struct isert_rdma_wr *wr)
2338 {
2339         struct se_cmd *se_cmd = &cmd->se_cmd;
2340         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
2341         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
2342         struct ib_device *ib_dev = isert_conn->conn_cm_id->device;
2343         struct ib_send_wr *send_wr;
2344         struct ib_sge *ib_sge;
2345         struct scatterlist *sg_start;
2346         struct fast_reg_descriptor *fr_desc;
2347         u32 sg_off = 0, sg_nents;
2348         u32 offset = 0, data_len, data_left, rdma_write_max;
2349         int ret = 0, count;
2350         unsigned long flags;
2351
2352         if (wr->iser_ib_op == ISER_IB_RDMA_WRITE) {
2353                 data_left = se_cmd->data_length;
2354         } else {
2355                 offset = cmd->write_data_done;
2356                 sg_off = offset / PAGE_SIZE;
2357                 data_left = se_cmd->data_length - cmd->write_data_done;
2358                 isert_cmd->tx_desc.isert_cmd = isert_cmd;
2359         }
2360
2361         sg_start = &cmd->se_cmd.t_data_sg[sg_off];
2362         sg_nents = se_cmd->t_data_nents - sg_off;
2363
2364         count = ib_dma_map_sg(ib_dev, sg_start, sg_nents,
2365                               (wr->iser_ib_op == ISER_IB_RDMA_WRITE) ?
2366                               DMA_TO_DEVICE : DMA_FROM_DEVICE);
2367         if (unlikely(!count)) {
2368                 pr_err("Cmd: %p unrable to map SGs\n", isert_cmd);
2369                 return -EINVAL;
2370         }
2371         wr->sge = sg_start;
2372         wr->num_sge = sg_nents;
2373         pr_debug("Mapped cmd: %p count: %u sg: %p sg_nents: %u rdma_len %d\n",
2374                  isert_cmd, count, sg_start, sg_nents, data_left);
2375
2376         memset(&wr->s_ib_sge, 0, sizeof(*ib_sge));
2377         ib_sge = &wr->s_ib_sge;
2378         wr->ib_sge = ib_sge;
2379
2380         wr->send_wr_num = 1;
2381         memset(&wr->s_send_wr, 0, sizeof(*send_wr));
2382         wr->send_wr = &wr->s_send_wr;
2383
2384         wr->isert_cmd = isert_cmd;
2385         rdma_write_max = ISCSI_ISER_SG_TABLESIZE * PAGE_SIZE;
2386
2387         send_wr = &isert_cmd->rdma_wr.s_send_wr;
2388         send_wr->sg_list = ib_sge;
2389         send_wr->num_sge = 1;
2390         send_wr->wr_id = (unsigned long)&isert_cmd->tx_desc;
2391         if (wr->iser_ib_op == ISER_IB_RDMA_WRITE) {
2392                 send_wr->opcode = IB_WR_RDMA_WRITE;
2393                 send_wr->wr.rdma.remote_addr = isert_cmd->read_va;
2394                 send_wr->wr.rdma.rkey = isert_cmd->read_stag;
2395                 send_wr->send_flags = 0;
2396                 send_wr->next = &isert_cmd->tx_desc.send_wr;
2397         } else {
2398                 send_wr->opcode = IB_WR_RDMA_READ;
2399                 send_wr->wr.rdma.remote_addr = isert_cmd->write_va;
2400                 send_wr->wr.rdma.rkey = isert_cmd->write_stag;
2401                 send_wr->send_flags = IB_SEND_SIGNALED;
2402         }
2403
2404         data_len = min(data_left, rdma_write_max);
2405         wr->cur_rdma_length = data_len;
2406
2407         /* if there is a single dma entry, dma mr is sufficient */
2408         if (count == 1) {
2409                 ib_sge->addr = ib_sg_dma_address(ib_dev, &sg_start[0]);
2410                 ib_sge->length = ib_sg_dma_len(ib_dev, &sg_start[0]);
2411                 ib_sge->lkey = isert_conn->conn_mr->lkey;
2412                 wr->fr_desc = NULL;
2413         } else {
2414                 spin_lock_irqsave(&isert_conn->conn_lock, flags);
2415                 fr_desc = list_first_entry(&isert_conn->conn_fr_pool,
2416                                            struct fast_reg_descriptor, list);
2417                 list_del(&fr_desc->list);
2418                 spin_unlock_irqrestore(&isert_conn->conn_lock, flags);
2419                 wr->fr_desc = fr_desc;
2420
2421                 ret = isert_fast_reg_mr(fr_desc, isert_conn, sg_start,
2422                                         ib_sge, sg_nents, offset, data_len);
2423                 if (ret) {
2424                         list_add_tail(&fr_desc->list, &isert_conn->conn_fr_pool);
2425                         goto unmap_sg;
2426                 }
2427         }
2428
2429         return 0;
2430
2431 unmap_sg:
2432         ib_dma_unmap_sg(ib_dev, sg_start, sg_nents,
2433                         (wr->iser_ib_op == ISER_IB_RDMA_WRITE) ?
2434                         DMA_TO_DEVICE : DMA_FROM_DEVICE);
2435         return ret;
2436 }
2437
2438 static int
2439 isert_put_datain(struct iscsi_conn *conn, struct iscsi_cmd *cmd)
2440 {
2441         struct se_cmd *se_cmd = &cmd->se_cmd;
2442         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
2443         struct isert_rdma_wr *wr = &isert_cmd->rdma_wr;
2444         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
2445         struct isert_device *device = isert_conn->conn_device;
2446         struct ib_send_wr *wr_failed;
2447         int rc;
2448
2449         pr_debug("Cmd: %p RDMA_WRITE data_length: %u\n",
2450                  isert_cmd, se_cmd->data_length);
2451         wr->iser_ib_op = ISER_IB_RDMA_WRITE;
2452         rc = device->reg_rdma_mem(conn, cmd, wr);
2453         if (rc) {
2454                 pr_err("Cmd: %p failed to prepare RDMA res\n", isert_cmd);
2455                 return rc;
2456         }
2457
2458         /*
2459          * Build isert_conn->tx_desc for iSCSI response PDU and attach
2460          */
2461         isert_create_send_desc(isert_conn, isert_cmd, &isert_cmd->tx_desc);
2462         iscsit_build_rsp_pdu(cmd, conn, true, (struct iscsi_scsi_rsp *)
2463                              &isert_cmd->tx_desc.iscsi_header);
2464         isert_init_tx_hdrs(isert_conn, &isert_cmd->tx_desc);
2465         isert_init_send_wr(isert_conn, isert_cmd,
2466                            &isert_cmd->tx_desc.send_wr, true);
2467
2468         atomic_add(wr->send_wr_num + 1, &isert_conn->post_send_buf_count);
2469
2470         rc = ib_post_send(isert_conn->conn_qp, wr->send_wr, &wr_failed);
2471         if (rc) {
2472                 pr_warn("ib_post_send() failed for IB_WR_RDMA_WRITE\n");
2473                 atomic_sub(wr->send_wr_num + 1, &isert_conn->post_send_buf_count);
2474         }
2475         pr_debug("Cmd: %p posted RDMA_WRITE + Response for iSER Data READ\n",
2476                  isert_cmd);
2477
2478         return 1;
2479 }
2480
2481 static int
2482 isert_get_dataout(struct iscsi_conn *conn, struct iscsi_cmd *cmd, bool recovery)
2483 {
2484         struct se_cmd *se_cmd = &cmd->se_cmd;
2485         struct isert_cmd *isert_cmd = iscsit_priv_cmd(cmd);
2486         struct isert_rdma_wr *wr = &isert_cmd->rdma_wr;
2487         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
2488         struct isert_device *device = isert_conn->conn_device;
2489         struct ib_send_wr *wr_failed;
2490         int rc;
2491
2492         pr_debug("Cmd: %p RDMA_READ data_length: %u write_data_done: %u\n",
2493                  isert_cmd, se_cmd->data_length, cmd->write_data_done);
2494         wr->iser_ib_op = ISER_IB_RDMA_READ;
2495         rc = device->reg_rdma_mem(conn, cmd, wr);
2496         if (rc) {
2497                 pr_err("Cmd: %p failed to prepare RDMA res\n", isert_cmd);
2498                 return rc;
2499         }
2500
2501         atomic_add(wr->send_wr_num, &isert_conn->post_send_buf_count);
2502
2503         rc = ib_post_send(isert_conn->conn_qp, wr->send_wr, &wr_failed);
2504         if (rc) {
2505                 pr_warn("ib_post_send() failed for IB_WR_RDMA_READ\n");
2506                 atomic_sub(wr->send_wr_num, &isert_conn->post_send_buf_count);
2507         }
2508         pr_debug("Cmd: %p posted RDMA_READ memory for ISER Data WRITE\n",
2509                  isert_cmd);
2510
2511         return 0;
2512 }
2513
2514 static int
2515 isert_immediate_queue(struct iscsi_conn *conn, struct iscsi_cmd *cmd, int state)
2516 {
2517         int ret;
2518
2519         switch (state) {
2520         case ISTATE_SEND_NOPIN_WANT_RESPONSE:
2521                 ret = isert_put_nopin(cmd, conn, false);
2522                 break;
2523         default:
2524                 pr_err("Unknown immediate state: 0x%02x\n", state);
2525                 ret = -EINVAL;
2526                 break;
2527         }
2528
2529         return ret;
2530 }
2531
2532 static int
2533 isert_response_queue(struct iscsi_conn *conn, struct iscsi_cmd *cmd, int state)
2534 {
2535         int ret;
2536
2537         switch (state) {
2538         case ISTATE_SEND_LOGOUTRSP:
2539                 ret = isert_put_logout_rsp(cmd, conn);
2540                 if (!ret) {
2541                         pr_debug("Returning iSER Logout -EAGAIN\n");
2542                         ret = -EAGAIN;
2543                 }
2544                 break;
2545         case ISTATE_SEND_NOPIN:
2546                 ret = isert_put_nopin(cmd, conn, true);
2547                 break;
2548         case ISTATE_SEND_TASKMGTRSP:
2549                 ret = isert_put_tm_rsp(cmd, conn);
2550                 break;
2551         case ISTATE_SEND_REJECT:
2552                 ret = isert_put_reject(cmd, conn);
2553                 break;
2554         case ISTATE_SEND_TEXTRSP:
2555                 ret = isert_put_text_rsp(cmd, conn);
2556                 break;
2557         case ISTATE_SEND_STATUS:
2558                 /*
2559                  * Special case for sending non GOOD SCSI status from TX thread
2560                  * context during pre se_cmd excecution failure.
2561                  */
2562                 ret = isert_put_response(conn, cmd);
2563                 break;
2564         default:
2565                 pr_err("Unknown response state: 0x%02x\n", state);
2566                 ret = -EINVAL;
2567                 break;
2568         }
2569
2570         return ret;
2571 }
2572
2573 static int
2574 isert_setup_np(struct iscsi_np *np,
2575                struct __kernel_sockaddr_storage *ksockaddr)
2576 {
2577         struct isert_np *isert_np;
2578         struct rdma_cm_id *isert_lid;
2579         struct sockaddr *sa;
2580         int ret;
2581
2582         isert_np = kzalloc(sizeof(struct isert_np), GFP_KERNEL);
2583         if (!isert_np) {
2584                 pr_err("Unable to allocate struct isert_np\n");
2585                 return -ENOMEM;
2586         }
2587         sema_init(&isert_np->np_sem, 0);
2588         mutex_init(&isert_np->np_accept_mutex);
2589         INIT_LIST_HEAD(&isert_np->np_accept_list);
2590         init_completion(&isert_np->np_login_comp);
2591
2592         sa = (struct sockaddr *)ksockaddr;
2593         pr_debug("ksockaddr: %p, sa: %p\n", ksockaddr, sa);
2594         /*
2595          * Setup the np->np_sockaddr from the passed sockaddr setup
2596          * in iscsi_target_configfs.c code..
2597          */
2598         memcpy(&np->np_sockaddr, ksockaddr,
2599                sizeof(struct __kernel_sockaddr_storage));
2600
2601         isert_lid = rdma_create_id(isert_cma_handler, np, RDMA_PS_TCP,
2602                                 IB_QPT_RC);
2603         if (IS_ERR(isert_lid)) {
2604                 pr_err("rdma_create_id() for isert_listen_handler failed: %ld\n",
2605                        PTR_ERR(isert_lid));
2606                 ret = PTR_ERR(isert_lid);
2607                 goto out;
2608         }
2609
2610         ret = rdma_bind_addr(isert_lid, sa);
2611         if (ret) {
2612                 pr_err("rdma_bind_addr() for isert_lid failed: %d\n", ret);
2613                 goto out_lid;
2614         }
2615
2616         ret = rdma_listen(isert_lid, ISERT_RDMA_LISTEN_BACKLOG);
2617         if (ret) {
2618                 pr_err("rdma_listen() for isert_lid failed: %d\n", ret);
2619                 goto out_lid;
2620         }
2621
2622         isert_np->np_cm_id = isert_lid;
2623         np->np_context = isert_np;
2624         pr_debug("Setup isert_lid->context: %p\n", isert_lid->context);
2625
2626         return 0;
2627
2628 out_lid:
2629         rdma_destroy_id(isert_lid);
2630 out:
2631         kfree(isert_np);
2632         return ret;
2633 }
2634
2635 static int
2636 isert_rdma_accept(struct isert_conn *isert_conn)
2637 {
2638         struct rdma_cm_id *cm_id = isert_conn->conn_cm_id;
2639         struct rdma_conn_param cp;
2640         int ret;
2641
2642         memset(&cp, 0, sizeof(struct rdma_conn_param));
2643         cp.responder_resources = isert_conn->responder_resources;
2644         cp.initiator_depth = isert_conn->initiator_depth;
2645         cp.retry_count = 7;
2646         cp.rnr_retry_count = 7;
2647
2648         pr_debug("Before rdma_accept >>>>>>>>>>>>>>>>>>>>.\n");
2649
2650         ret = rdma_accept(cm_id, &cp);
2651         if (ret) {
2652                 pr_err("rdma_accept() failed with: %d\n", ret);
2653                 return ret;
2654         }
2655
2656         pr_debug("After rdma_accept >>>>>>>>>>>>>>>>>>>>>.\n");
2657
2658         return 0;
2659 }
2660
2661 static int
2662 isert_get_login_rx(struct iscsi_conn *conn, struct iscsi_login *login)
2663 {
2664         struct isert_conn *isert_conn = (struct isert_conn *)conn->context;
2665         int ret;
2666
2667         pr_debug("isert_get_login_rx before conn_login_comp conn: %p\n", conn);
2668         /*
2669          * For login requests after the first PDU, isert_rx_login_req() will
2670          * kick schedule_delayed_work(&conn->login_work) as the packet is
2671          * received, which turns this callback from iscsi_target_do_login_rx()
2672          * into a NOP.
2673          */
2674         if (!login->first_request)
2675                 return 0;
2676
2677         ret = wait_for_completion_interruptible(&isert_conn->conn_login_comp);
2678         if (ret)
2679                 return ret;
2680
2681         pr_debug("isert_get_login_rx processing login->req: %p\n", login->req);
2682         return 0;
2683 }
2684
2685 static void
2686 isert_set_conn_info(struct iscsi_np *np, struct iscsi_conn *conn,
2687                     struct isert_conn *isert_conn)
2688 {
2689         struct rdma_cm_id *cm_id = isert_conn->conn_cm_id;
2690         struct rdma_route *cm_route = &cm_id->route;
2691         struct sockaddr_in *sock_in;
2692         struct sockaddr_in6 *sock_in6;
2693
2694         conn->login_family = np->np_sockaddr.ss_family;
2695
2696         if (np->np_sockaddr.ss_family == AF_INET6) {
2697                 sock_in6 = (struct sockaddr_in6 *)&cm_route->addr.dst_addr;
2698                 snprintf(conn->login_ip, sizeof(conn->login_ip), "%pI6c",
2699                          &sock_in6->sin6_addr.in6_u);
2700                 conn->login_port = ntohs(sock_in6->sin6_port);
2701
2702                 sock_in6 = (struct sockaddr_in6 *)&cm_route->addr.src_addr;
2703                 snprintf(conn->local_ip, sizeof(conn->local_ip), "%pI6c",
2704                          &sock_in6->sin6_addr.in6_u);
2705                 conn->local_port = ntohs(sock_in6->sin6_port);
2706         } else {
2707                 sock_in = (struct sockaddr_in *)&cm_route->addr.dst_addr;
2708                 sprintf(conn->login_ip, "%pI4",
2709                         &sock_in->sin_addr.s_addr);
2710                 conn->login_port = ntohs(sock_in->sin_port);
2711
2712                 sock_in = (struct sockaddr_in *)&cm_route->addr.src_addr;
2713                 sprintf(conn->local_ip, "%pI4",
2714                         &sock_in->sin_addr.s_addr);
2715                 conn->local_port = ntohs(sock_in->sin_port);
2716         }
2717 }
2718
2719 static int
2720 isert_accept_np(struct iscsi_np *np, struct iscsi_conn *conn)
2721 {
2722         struct isert_np *isert_np = (struct isert_np *)np->np_context;
2723         struct isert_conn *isert_conn;
2724         int max_accept = 0, ret;
2725
2726 accept_wait:
2727         ret = down_interruptible(&isert_np->np_sem);
2728         if (max_accept > 5)
2729                 return -ENODEV;
2730
2731         spin_lock_bh(&np->np_thread_lock);
2732         if (np->np_thread_state >= ISCSI_NP_THREAD_RESET) {
2733                 spin_unlock_bh(&np->np_thread_lock);
2734                 pr_debug("np_thread_state %d for isert_accept_np\n",
2735                          np->np_thread_state);
2736                 /**
2737                  * No point in stalling here when np_thread
2738                  * is in state RESET/SHUTDOWN/EXIT - bail
2739                  **/
2740                 return -ENODEV;
2741         }
2742         spin_unlock_bh(&np->np_thread_lock);
2743
2744         mutex_lock(&isert_np->np_accept_mutex);
2745         if (list_empty(&isert_np->np_accept_list)) {
2746                 mutex_unlock(&isert_np->np_accept_mutex);
2747                 max_accept++;
2748                 goto accept_wait;
2749         }
2750         isert_conn = list_first_entry(&isert_np->np_accept_list,
2751                         struct isert_conn, conn_accept_node);
2752         list_del_init(&isert_conn->conn_accept_node);
2753         mutex_unlock(&isert_np->np_accept_mutex);
2754
2755         conn->context = isert_conn;
2756         isert_conn->conn = conn;
2757         max_accept = 0;
2758
2759         ret = isert_rdma_post_recvl(isert_conn);
2760         if (ret)
2761                 return ret;
2762
2763         ret = isert_rdma_accept(isert_conn);
2764         if (ret)
2765                 return ret;
2766
2767         isert_set_conn_info(np, conn, isert_conn);
2768
2769         pr_debug("Processing isert_accept_np: isert_conn: %p\n", isert_conn);
2770         return 0;
2771 }
2772
2773 static void
2774 isert_free_np(struct iscsi_np *np)
2775 {
2776         struct isert_np *isert_np = (struct isert_np *)np->np_context;
2777
2778         rdma_destroy_id(isert_np->np_cm_id);
2779
2780         np->np_context = NULL;
2781         kfree(isert_np);
2782 }
2783
2784 static void isert_wait_conn(struct iscsi_conn *conn)
2785 {
2786         struct isert_conn *isert_conn = conn->context;
2787
2788         pr_debug("isert_wait_conn: Starting \n");
2789
2790         mutex_lock(&isert_conn->conn_mutex);
2791         if (isert_conn->conn_cm_id) {
2792                 pr_debug("Calling rdma_disconnect from isert_wait_conn\n");
2793                 rdma_disconnect(isert_conn->conn_cm_id);
2794         }
2795         /*
2796          * Only wait for conn_wait_comp_err if the isert_conn made it
2797          * into full feature phase..
2798          */
2799         if (isert_conn->state == ISER_CONN_INIT) {
2800                 mutex_unlock(&isert_conn->conn_mutex);
2801                 return;
2802         }
2803         if (isert_conn->state == ISER_CONN_UP)
2804                 isert_conn->state = ISER_CONN_TERMINATING;
2805         mutex_unlock(&isert_conn->conn_mutex);
2806
2807         wait_for_completion(&isert_conn->conn_wait_comp_err);
2808
2809         wait_for_completion(&isert_conn->conn_wait);
2810         isert_put_conn(isert_conn);
2811 }
2812
2813 static void isert_free_conn(struct iscsi_conn *conn)
2814 {
2815         struct isert_conn *isert_conn = conn->context;
2816
2817         isert_put_conn(isert_conn);
2818 }
2819
2820 static struct iscsit_transport iser_target_transport = {
2821         .name                   = "IB/iSER",
2822         .transport_type         = ISCSI_INFINIBAND,
2823         .priv_size              = sizeof(struct isert_cmd),
2824         .owner                  = THIS_MODULE,
2825         .iscsit_setup_np        = isert_setup_np,
2826         .iscsit_accept_np       = isert_accept_np,
2827         .iscsit_free_np         = isert_free_np,
2828         .iscsit_wait_conn       = isert_wait_conn,
2829         .iscsit_free_conn       = isert_free_conn,
2830         .iscsit_get_login_rx    = isert_get_login_rx,
2831         .iscsit_put_login_tx    = isert_put_login_tx,
2832         .iscsit_immediate_queue = isert_immediate_queue,
2833         .iscsit_response_queue  = isert_response_queue,
2834         .iscsit_get_dataout     = isert_get_dataout,
2835         .iscsit_queue_data_in   = isert_put_datain,
2836         .iscsit_queue_status    = isert_put_response,
2837 };
2838
2839 static int __init isert_init(void)
2840 {
2841         int ret;
2842
2843         isert_rx_wq = alloc_workqueue("isert_rx_wq", 0, 0);
2844         if (!isert_rx_wq) {
2845                 pr_err("Unable to allocate isert_rx_wq\n");
2846                 return -ENOMEM;
2847         }
2848
2849         isert_comp_wq = alloc_workqueue("isert_comp_wq", 0, 0);
2850         if (!isert_comp_wq) {
2851                 pr_err("Unable to allocate isert_comp_wq\n");
2852                 ret = -ENOMEM;
2853                 goto destroy_rx_wq;
2854         }
2855
2856         iscsit_register_transport(&iser_target_transport);
2857         pr_debug("iSER_TARGET[0] - Loaded iser_target_transport\n");
2858         return 0;
2859
2860 destroy_rx_wq:
2861         destroy_workqueue(isert_rx_wq);
2862         return ret;
2863 }
2864
2865 static void __exit isert_exit(void)
2866 {
2867         flush_scheduled_work();
2868         destroy_workqueue(isert_comp_wq);
2869         destroy_workqueue(isert_rx_wq);
2870         iscsit_unregister_transport(&iser_target_transport);
2871         pr_debug("iSER_TARGET[0] - Released iser_target_transport\n");
2872 }
2873
2874 MODULE_DESCRIPTION("iSER-Target for mainline target infrastructure");
2875 MODULE_VERSION("0.1");
2876 MODULE_AUTHOR("nab@Linux-iSCSI.org");
2877 MODULE_LICENSE("GPL");
2878
2879 module_init(isert_init);
2880 module_exit(isert_exit);