[GFS2] Fix up merge of Linus' kernel into GFS2
[pandora-kernel.git] / drivers / infiniband / hw / amso1100 / c2_qp.c
1 /*
2  * Copyright (c) 2004 Topspin Communications.  All rights reserved.
3  * Copyright (c) 2005 Cisco Systems. All rights reserved.
4  * Copyright (c) 2005 Mellanox Technologies. All rights reserved.
5  * Copyright (c) 2004 Voltaire, Inc. All rights reserved.
6  * Copyright (c) 2005 Open Grid Computing, Inc. All rights reserved.
7  *
8  * This software is available to you under a choice of one of two
9  * licenses.  You may choose to be licensed under the terms of the GNU
10  * General Public License (GPL) Version 2, available from the file
11  * COPYING in the main directory of this source tree, or the
12  * OpenIB.org BSD license below:
13  *
14  *     Redistribution and use in source and binary forms, with or
15  *     without modification, are permitted provided that the following
16  *     conditions are met:
17  *
18  *      - Redistributions of source code must retain the above
19  *        copyright notice, this list of conditions and the following
20  *        disclaimer.
21  *
22  *      - Redistributions in binary form must reproduce the above
23  *        copyright notice, this list of conditions and the following
24  *        disclaimer in the documentation and/or other materials
25  *        provided with the distribution.
26  *
27  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
28  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
29  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
30  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
31  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
32  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
33  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
34  * SOFTWARE.
35  *
36  */
37
38 #include "c2.h"
39 #include "c2_vq.h"
40 #include "c2_status.h"
41
42 #define C2_MAX_ORD_PER_QP 128
43 #define C2_MAX_IRD_PER_QP 128
44
45 #define C2_HINT_MAKE(q_index, hint_count) (((q_index) << 16) | hint_count)
46 #define C2_HINT_GET_INDEX(hint) (((hint) & 0x7FFF0000) >> 16)
47 #define C2_HINT_GET_COUNT(hint) ((hint) & 0x0000FFFF)
48
49 #define NO_SUPPORT -1
50 static const u8 c2_opcode[] = {
51         [IB_WR_SEND] = C2_WR_TYPE_SEND,
52         [IB_WR_SEND_WITH_IMM] = NO_SUPPORT,
53         [IB_WR_RDMA_WRITE] = C2_WR_TYPE_RDMA_WRITE,
54         [IB_WR_RDMA_WRITE_WITH_IMM] = NO_SUPPORT,
55         [IB_WR_RDMA_READ] = C2_WR_TYPE_RDMA_READ,
56         [IB_WR_ATOMIC_CMP_AND_SWP] = NO_SUPPORT,
57         [IB_WR_ATOMIC_FETCH_AND_ADD] = NO_SUPPORT,
58 };
59
60 static int to_c2_state(enum ib_qp_state ib_state)
61 {
62         switch (ib_state) {
63         case IB_QPS_RESET:
64                 return C2_QP_STATE_IDLE;
65         case IB_QPS_RTS:
66                 return C2_QP_STATE_RTS;
67         case IB_QPS_SQD:
68                 return C2_QP_STATE_CLOSING;
69         case IB_QPS_SQE:
70                 return C2_QP_STATE_CLOSING;
71         case IB_QPS_ERR:
72                 return C2_QP_STATE_ERROR;
73         default:
74                 return -1;
75         }
76 }
77
78 static int to_ib_state(enum c2_qp_state c2_state)
79 {
80         switch (c2_state) {
81         case C2_QP_STATE_IDLE:
82                 return IB_QPS_RESET;
83         case C2_QP_STATE_CONNECTING:
84                 return IB_QPS_RTR;
85         case C2_QP_STATE_RTS:
86                 return IB_QPS_RTS;
87         case C2_QP_STATE_CLOSING:
88                 return IB_QPS_SQD;
89         case C2_QP_STATE_ERROR:
90                 return IB_QPS_ERR;
91         case C2_QP_STATE_TERMINATE:
92                 return IB_QPS_SQE;
93         default:
94                 return -1;
95         }
96 }
97
98 static const char *to_ib_state_str(int ib_state)
99 {
100         static const char *state_str[] = {
101                 "IB_QPS_RESET",
102                 "IB_QPS_INIT",
103                 "IB_QPS_RTR",
104                 "IB_QPS_RTS",
105                 "IB_QPS_SQD",
106                 "IB_QPS_SQE",
107                 "IB_QPS_ERR"
108         };
109         if (ib_state < IB_QPS_RESET ||
110             ib_state > IB_QPS_ERR)
111                 return "<invalid IB QP state>";
112
113         ib_state -= IB_QPS_RESET;
114         return state_str[ib_state];
115 }
116
117 void c2_set_qp_state(struct c2_qp *qp, int c2_state)
118 {
119         int new_state = to_ib_state(c2_state);
120
121         pr_debug("%s: qp[%p] state modify %s --> %s\n",
122                __FUNCTION__,
123                 qp,
124                 to_ib_state_str(qp->state),
125                 to_ib_state_str(new_state));
126         qp->state = new_state;
127 }
128
129 #define C2_QP_NO_ATTR_CHANGE 0xFFFFFFFF
130
131 int c2_qp_modify(struct c2_dev *c2dev, struct c2_qp *qp,
132                  struct ib_qp_attr *attr, int attr_mask)
133 {
134         struct c2wr_qp_modify_req wr;
135         struct c2wr_qp_modify_rep *reply;
136         struct c2_vq_req *vq_req;
137         unsigned long flags;
138         u8 next_state;
139         int err;
140
141         pr_debug("%s:%d qp=%p, %s --> %s\n",
142                 __FUNCTION__, __LINE__,
143                 qp,
144                 to_ib_state_str(qp->state),
145                 to_ib_state_str(attr->qp_state));
146
147         vq_req = vq_req_alloc(c2dev);
148         if (!vq_req)
149                 return -ENOMEM;
150
151         c2_wr_set_id(&wr, CCWR_QP_MODIFY);
152         wr.hdr.context = (unsigned long) vq_req;
153         wr.rnic_handle = c2dev->adapter_handle;
154         wr.qp_handle = qp->adapter_handle;
155         wr.ord = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
156         wr.ird = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
157         wr.sq_depth = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
158         wr.rq_depth = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
159
160         if (attr_mask & IB_QP_STATE) {
161                 /* Ensure the state is valid */
162                 if (attr->qp_state < 0 || attr->qp_state > IB_QPS_ERR)
163                         return -EINVAL;
164
165                 wr.next_qp_state = cpu_to_be32(to_c2_state(attr->qp_state));
166
167                 if (attr->qp_state == IB_QPS_ERR) {
168                         spin_lock_irqsave(&qp->lock, flags);
169                         if (qp->cm_id && qp->state == IB_QPS_RTS) {
170                                 pr_debug("Generating CLOSE event for QP-->ERR, "
171                                         "qp=%p, cm_id=%p\n",qp,qp->cm_id);
172                                 /* Generate an CLOSE event */
173                                 vq_req->cm_id = qp->cm_id;
174                                 vq_req->event = IW_CM_EVENT_CLOSE;
175                         }
176                         spin_unlock_irqrestore(&qp->lock, flags);
177                 }
178                 next_state =  attr->qp_state;
179
180         } else if (attr_mask & IB_QP_CUR_STATE) {
181
182                 if (attr->cur_qp_state != IB_QPS_RTR &&
183                     attr->cur_qp_state != IB_QPS_RTS &&
184                     attr->cur_qp_state != IB_QPS_SQD &&
185                     attr->cur_qp_state != IB_QPS_SQE)
186                         return -EINVAL;
187                 else
188                         wr.next_qp_state =
189                             cpu_to_be32(to_c2_state(attr->cur_qp_state));
190
191                 next_state = attr->cur_qp_state;
192
193         } else {
194                 err = 0;
195                 goto bail0;
196         }
197
198         /* reference the request struct */
199         vq_req_get(c2dev, vq_req);
200
201         err = vq_send_wr(c2dev, (union c2wr *) & wr);
202         if (err) {
203                 vq_req_put(c2dev, vq_req);
204                 goto bail0;
205         }
206
207         err = vq_wait_for_reply(c2dev, vq_req);
208         if (err)
209                 goto bail0;
210
211         reply = (struct c2wr_qp_modify_rep *) (unsigned long) vq_req->reply_msg;
212         if (!reply) {
213                 err = -ENOMEM;
214                 goto bail0;
215         }
216
217         err = c2_errno(reply);
218         if (!err)
219                 qp->state = next_state;
220 #ifdef DEBUG
221         else
222                 pr_debug("%s: c2_errno=%d\n", __FUNCTION__, err);
223 #endif
224         /*
225          * If we're going to error and generating the event here, then
226          * we need to remove the reference because there will be no
227          * close event generated by the adapter
228         */
229         spin_lock_irqsave(&qp->lock, flags);
230         if (vq_req->event==IW_CM_EVENT_CLOSE && qp->cm_id) {
231                 qp->cm_id->rem_ref(qp->cm_id);
232                 qp->cm_id = NULL;
233         }
234         spin_unlock_irqrestore(&qp->lock, flags);
235
236         vq_repbuf_free(c2dev, reply);
237       bail0:
238         vq_req_free(c2dev, vq_req);
239
240         pr_debug("%s:%d qp=%p, cur_state=%s\n",
241                 __FUNCTION__, __LINE__,
242                 qp,
243                 to_ib_state_str(qp->state));
244         return err;
245 }
246
247 int c2_qp_set_read_limits(struct c2_dev *c2dev, struct c2_qp *qp,
248                           int ord, int ird)
249 {
250         struct c2wr_qp_modify_req wr;
251         struct c2wr_qp_modify_rep *reply;
252         struct c2_vq_req *vq_req;
253         int err;
254
255         vq_req = vq_req_alloc(c2dev);
256         if (!vq_req)
257                 return -ENOMEM;
258
259         c2_wr_set_id(&wr, CCWR_QP_MODIFY);
260         wr.hdr.context = (unsigned long) vq_req;
261         wr.rnic_handle = c2dev->adapter_handle;
262         wr.qp_handle = qp->adapter_handle;
263         wr.ord = cpu_to_be32(ord);
264         wr.ird = cpu_to_be32(ird);
265         wr.sq_depth = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
266         wr.rq_depth = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
267         wr.next_qp_state = cpu_to_be32(C2_QP_NO_ATTR_CHANGE);
268
269         /* reference the request struct */
270         vq_req_get(c2dev, vq_req);
271
272         err = vq_send_wr(c2dev, (union c2wr *) & wr);
273         if (err) {
274                 vq_req_put(c2dev, vq_req);
275                 goto bail0;
276         }
277
278         err = vq_wait_for_reply(c2dev, vq_req);
279         if (err)
280                 goto bail0;
281
282         reply = (struct c2wr_qp_modify_rep *) (unsigned long)
283                 vq_req->reply_msg;
284         if (!reply) {
285                 err = -ENOMEM;
286                 goto bail0;
287         }
288
289         err = c2_errno(reply);
290         vq_repbuf_free(c2dev, reply);
291       bail0:
292         vq_req_free(c2dev, vq_req);
293         return err;
294 }
295
296 static int destroy_qp(struct c2_dev *c2dev, struct c2_qp *qp)
297 {
298         struct c2_vq_req *vq_req;
299         struct c2wr_qp_destroy_req wr;
300         struct c2wr_qp_destroy_rep *reply;
301         unsigned long flags;
302         int err;
303
304         /*
305          * Allocate a verb request message
306          */
307         vq_req = vq_req_alloc(c2dev);
308         if (!vq_req) {
309                 return -ENOMEM;
310         }
311
312         /*
313          * Initialize the WR
314          */
315         c2_wr_set_id(&wr, CCWR_QP_DESTROY);
316         wr.hdr.context = (unsigned long) vq_req;
317         wr.rnic_handle = c2dev->adapter_handle;
318         wr.qp_handle = qp->adapter_handle;
319
320         /*
321          * reference the request struct.  dereferenced in the int handler.
322          */
323         vq_req_get(c2dev, vq_req);
324
325         spin_lock_irqsave(&qp->lock, flags);
326         if (qp->cm_id && qp->state == IB_QPS_RTS) {
327                 pr_debug("destroy_qp: generating CLOSE event for QP-->ERR, "
328                         "qp=%p, cm_id=%p\n",qp,qp->cm_id);
329                 /* Generate an CLOSE event */
330                 vq_req->qp = qp;
331                 vq_req->cm_id = qp->cm_id;
332                 vq_req->event = IW_CM_EVENT_CLOSE;
333         }
334         spin_unlock_irqrestore(&qp->lock, flags);
335
336         /*
337          * Send WR to adapter
338          */
339         err = vq_send_wr(c2dev, (union c2wr *) & wr);
340         if (err) {
341                 vq_req_put(c2dev, vq_req);
342                 goto bail0;
343         }
344
345         /*
346          * Wait for reply from adapter
347          */
348         err = vq_wait_for_reply(c2dev, vq_req);
349         if (err) {
350                 goto bail0;
351         }
352
353         /*
354          * Process reply
355          */
356         reply = (struct c2wr_qp_destroy_rep *) (unsigned long) (vq_req->reply_msg);
357         if (!reply) {
358                 err = -ENOMEM;
359                 goto bail0;
360         }
361
362         spin_lock_irqsave(&qp->lock, flags);
363         if (qp->cm_id) {
364                 qp->cm_id->rem_ref(qp->cm_id);
365                 qp->cm_id = NULL;
366         }
367         spin_unlock_irqrestore(&qp->lock, flags);
368
369         vq_repbuf_free(c2dev, reply);
370       bail0:
371         vq_req_free(c2dev, vq_req);
372         return err;
373 }
374
375 static int c2_alloc_qpn(struct c2_dev *c2dev, struct c2_qp *qp)
376 {
377         int ret;
378
379         do {
380                 spin_lock_irq(&c2dev->qp_table.lock);
381                 ret = idr_get_new_above(&c2dev->qp_table.idr, qp,
382                                         c2dev->qp_table.last++, &qp->qpn);
383                 spin_unlock_irq(&c2dev->qp_table.lock);
384         } while ((ret == -EAGAIN) &&
385                  idr_pre_get(&c2dev->qp_table.idr, GFP_KERNEL));
386         return ret;
387 }
388
389 static void c2_free_qpn(struct c2_dev *c2dev, int qpn)
390 {
391         spin_lock_irq(&c2dev->qp_table.lock);
392         idr_remove(&c2dev->qp_table.idr, qpn);
393         spin_unlock_irq(&c2dev->qp_table.lock);
394 }
395
396 struct c2_qp *c2_find_qpn(struct c2_dev *c2dev, int qpn)
397 {
398         unsigned long flags;
399         struct c2_qp *qp;
400
401         spin_lock_irqsave(&c2dev->qp_table.lock, flags);
402         qp = idr_find(&c2dev->qp_table.idr, qpn);
403         spin_unlock_irqrestore(&c2dev->qp_table.lock, flags);
404         return qp;
405 }
406
407 int c2_alloc_qp(struct c2_dev *c2dev,
408                 struct c2_pd *pd,
409                 struct ib_qp_init_attr *qp_attrs, struct c2_qp *qp)
410 {
411         struct c2wr_qp_create_req wr;
412         struct c2wr_qp_create_rep *reply;
413         struct c2_vq_req *vq_req;
414         struct c2_cq *send_cq = to_c2cq(qp_attrs->send_cq);
415         struct c2_cq *recv_cq = to_c2cq(qp_attrs->recv_cq);
416         unsigned long peer_pa;
417         u32 q_size, msg_size, mmap_size;
418         void __iomem *mmap;
419         int err;
420
421         err = c2_alloc_qpn(c2dev, qp);
422         if (err)
423                 return err;
424         qp->ibqp.qp_num = qp->qpn;
425         qp->ibqp.qp_type = IB_QPT_RC;
426
427         /* Allocate the SQ and RQ shared pointers */
428         qp->sq_mq.shared = c2_alloc_mqsp(c2dev, c2dev->kern_mqsp_pool,
429                                          &qp->sq_mq.shared_dma, GFP_KERNEL);
430         if (!qp->sq_mq.shared) {
431                 err = -ENOMEM;
432                 goto bail0;
433         }
434
435         qp->rq_mq.shared = c2_alloc_mqsp(c2dev, c2dev->kern_mqsp_pool,
436                                          &qp->rq_mq.shared_dma, GFP_KERNEL);
437         if (!qp->rq_mq.shared) {
438                 err = -ENOMEM;
439                 goto bail1;
440         }
441
442         /* Allocate the verbs request */
443         vq_req = vq_req_alloc(c2dev);
444         if (vq_req == NULL) {
445                 err = -ENOMEM;
446                 goto bail2;
447         }
448
449         /* Initialize the work request */
450         memset(&wr, 0, sizeof(wr));
451         c2_wr_set_id(&wr, CCWR_QP_CREATE);
452         wr.hdr.context = (unsigned long) vq_req;
453         wr.rnic_handle = c2dev->adapter_handle;
454         wr.sq_cq_handle = send_cq->adapter_handle;
455         wr.rq_cq_handle = recv_cq->adapter_handle;
456         wr.sq_depth = cpu_to_be32(qp_attrs->cap.max_send_wr + 1);
457         wr.rq_depth = cpu_to_be32(qp_attrs->cap.max_recv_wr + 1);
458         wr.srq_handle = 0;
459         wr.flags = cpu_to_be32(QP_RDMA_READ | QP_RDMA_WRITE | QP_MW_BIND |
460                                QP_ZERO_STAG | QP_RDMA_READ_RESPONSE);
461         wr.send_sgl_depth = cpu_to_be32(qp_attrs->cap.max_send_sge);
462         wr.recv_sgl_depth = cpu_to_be32(qp_attrs->cap.max_recv_sge);
463         wr.rdma_write_sgl_depth = cpu_to_be32(qp_attrs->cap.max_send_sge);
464         wr.shared_sq_ht = cpu_to_be64(qp->sq_mq.shared_dma);
465         wr.shared_rq_ht = cpu_to_be64(qp->rq_mq.shared_dma);
466         wr.ord = cpu_to_be32(C2_MAX_ORD_PER_QP);
467         wr.ird = cpu_to_be32(C2_MAX_IRD_PER_QP);
468         wr.pd_id = pd->pd_id;
469         wr.user_context = (unsigned long) qp;
470
471         vq_req_get(c2dev, vq_req);
472
473         /* Send the WR to the adapter */
474         err = vq_send_wr(c2dev, (union c2wr *) & wr);
475         if (err) {
476                 vq_req_put(c2dev, vq_req);
477                 goto bail3;
478         }
479
480         /* Wait for the verb reply  */
481         err = vq_wait_for_reply(c2dev, vq_req);
482         if (err) {
483                 goto bail3;
484         }
485
486         /* Process the reply */
487         reply = (struct c2wr_qp_create_rep *) (unsigned long) (vq_req->reply_msg);
488         if (!reply) {
489                 err = -ENOMEM;
490                 goto bail3;
491         }
492
493         if ((err = c2_wr_get_result(reply)) != 0) {
494                 goto bail4;
495         }
496
497         /* Fill in the kernel QP struct */
498         atomic_set(&qp->refcount, 1);
499         qp->adapter_handle = reply->qp_handle;
500         qp->state = IB_QPS_RESET;
501         qp->send_sgl_depth = qp_attrs->cap.max_send_sge;
502         qp->rdma_write_sgl_depth = qp_attrs->cap.max_send_sge;
503         qp->recv_sgl_depth = qp_attrs->cap.max_recv_sge;
504
505         /* Initialize the SQ MQ */
506         q_size = be32_to_cpu(reply->sq_depth);
507         msg_size = be32_to_cpu(reply->sq_msg_size);
508         peer_pa = c2dev->pa + be32_to_cpu(reply->sq_mq_start);
509         mmap_size = PAGE_ALIGN(sizeof(struct c2_mq_shared) + msg_size * q_size);
510         mmap = ioremap_nocache(peer_pa, mmap_size);
511         if (!mmap) {
512                 err = -ENOMEM;
513                 goto bail5;
514         }
515
516         c2_mq_req_init(&qp->sq_mq,
517                        be32_to_cpu(reply->sq_mq_index),
518                        q_size,
519                        msg_size,
520                        mmap + sizeof(struct c2_mq_shared),      /* pool start */
521                        mmap,                            /* peer */
522                        C2_MQ_ADAPTER_TARGET);
523
524         /* Initialize the RQ mq */
525         q_size = be32_to_cpu(reply->rq_depth);
526         msg_size = be32_to_cpu(reply->rq_msg_size);
527         peer_pa = c2dev->pa + be32_to_cpu(reply->rq_mq_start);
528         mmap_size = PAGE_ALIGN(sizeof(struct c2_mq_shared) + msg_size * q_size);
529         mmap = ioremap_nocache(peer_pa, mmap_size);
530         if (!mmap) {
531                 err = -ENOMEM;
532                 goto bail6;
533         }
534
535         c2_mq_req_init(&qp->rq_mq,
536                        be32_to_cpu(reply->rq_mq_index),
537                        q_size,
538                        msg_size,
539                        mmap + sizeof(struct c2_mq_shared),      /* pool start */
540                        mmap,                            /* peer */
541                        C2_MQ_ADAPTER_TARGET);
542
543         vq_repbuf_free(c2dev, reply);
544         vq_req_free(c2dev, vq_req);
545
546         return 0;
547
548       bail6:
549         iounmap(qp->sq_mq.peer);
550       bail5:
551         destroy_qp(c2dev, qp);
552       bail4:
553         vq_repbuf_free(c2dev, reply);
554       bail3:
555         vq_req_free(c2dev, vq_req);
556       bail2:
557         c2_free_mqsp(qp->rq_mq.shared);
558       bail1:
559         c2_free_mqsp(qp->sq_mq.shared);
560       bail0:
561         c2_free_qpn(c2dev, qp->qpn);
562         return err;
563 }
564
565 void c2_free_qp(struct c2_dev *c2dev, struct c2_qp *qp)
566 {
567         struct c2_cq *send_cq;
568         struct c2_cq *recv_cq;
569
570         send_cq = to_c2cq(qp->ibqp.send_cq);
571         recv_cq = to_c2cq(qp->ibqp.recv_cq);
572
573         /*
574          * Lock CQs here, so that CQ polling code can do QP lookup
575          * without taking a lock.
576          */
577         spin_lock_irq(&send_cq->lock);
578         if (send_cq != recv_cq)
579                 spin_lock(&recv_cq->lock);
580
581         c2_free_qpn(c2dev, qp->qpn);
582
583         if (send_cq != recv_cq)
584                 spin_unlock(&recv_cq->lock);
585         spin_unlock_irq(&send_cq->lock);
586
587         /*
588          * Destory qp in the rnic...
589          */
590         destroy_qp(c2dev, qp);
591
592         /*
593          * Mark any unreaped CQEs as null and void.
594          */
595         c2_cq_clean(c2dev, qp, send_cq->cqn);
596         if (send_cq != recv_cq)
597                 c2_cq_clean(c2dev, qp, recv_cq->cqn);
598         /*
599          * Unmap the MQs and return the shared pointers
600          * to the message pool.
601          */
602         iounmap(qp->sq_mq.peer);
603         iounmap(qp->rq_mq.peer);
604         c2_free_mqsp(qp->sq_mq.shared);
605         c2_free_mqsp(qp->rq_mq.shared);
606
607         atomic_dec(&qp->refcount);
608         wait_event(qp->wait, !atomic_read(&qp->refcount));
609 }
610
611 /*
612  * Function: move_sgl
613  *
614  * Description:
615  * Move an SGL from the user's work request struct into a CCIL Work Request
616  * message, swapping to WR byte order and ensure the total length doesn't
617  * overflow.
618  *
619  * IN:
620  * dst          - ptr to CCIL Work Request message SGL memory.
621  * src          - ptr to the consumers SGL memory.
622  *
623  * OUT: none
624  *
625  * Return:
626  * CCIL status codes.
627  */
628 static int
629 move_sgl(struct c2_data_addr * dst, struct ib_sge *src, int count, u32 * p_len,
630          u8 * actual_count)
631 {
632         u32 tot = 0;            /* running total */
633         u8 acount = 0;          /* running total non-0 len sge's */
634
635         while (count > 0) {
636                 /*
637                  * If the addition of this SGE causes the
638                  * total SGL length to exceed 2^32-1, then
639                  * fail-n-bail.
640                  *
641                  * If the current total plus the next element length
642                  * wraps, then it will go negative and be less than the
643                  * current total...
644                  */
645                 if ((tot + src->length) < tot) {
646                         return -EINVAL;
647                 }
648                 /*
649                  * Bug: 1456 (as well as 1498 & 1643)
650                  * Skip over any sge's supplied with len=0
651                  */
652                 if (src->length) {
653                         tot += src->length;
654                         dst->stag = cpu_to_be32(src->lkey);
655                         dst->to = cpu_to_be64(src->addr);
656                         dst->length = cpu_to_be32(src->length);
657                         dst++;
658                         acount++;
659                 }
660                 src++;
661                 count--;
662         }
663
664         if (acount == 0) {
665                 /*
666                  * Bug: 1476 (as well as 1498, 1456 and 1643)
667                  * Setup the SGL in the WR to make it easier for the RNIC.
668                  * This way, the FW doesn't have to deal with special cases.
669                  * Setting length=0 should be sufficient.
670                  */
671                 dst->stag = 0;
672                 dst->to = 0;
673                 dst->length = 0;
674         }
675
676         *p_len = tot;
677         *actual_count = acount;
678         return 0;
679 }
680
681 /*
682  * Function: c2_activity (private function)
683  *
684  * Description:
685  * Post an mq index to the host->adapter activity fifo.
686  *
687  * IN:
688  * c2dev        - ptr to c2dev structure
689  * mq_index     - mq index to post
690  * shared       - value most recently written to shared
691  *
692  * OUT:
693  *
694  * Return:
695  * none
696  */
697 static inline void c2_activity(struct c2_dev *c2dev, u32 mq_index, u16 shared)
698 {
699         /*
700          * First read the register to see if the FIFO is full, and if so,
701          * spin until it's not.  This isn't perfect -- there is no
702          * synchronization among the clients of the register, but in
703          * practice it prevents multiple CPU from hammering the bus
704          * with PCI RETRY. Note that when this does happen, the card
705          * cannot get on the bus and the card and system hang in a
706          * deadlock -- thus the need for this code. [TOT]
707          */
708         while (readl(c2dev->regs + PCI_BAR0_ADAPTER_HINT) & 0x80000000) {
709                 set_current_state(TASK_UNINTERRUPTIBLE);
710                 schedule_timeout(0);
711         }
712
713         __raw_writel(C2_HINT_MAKE(mq_index, shared),
714                      c2dev->regs + PCI_BAR0_ADAPTER_HINT);
715 }
716
717 /*
718  * Function: qp_wr_post
719  *
720  * Description:
721  * This in-line function allocates a MQ msg, then moves the host-copy of
722  * the completed WR into msg.  Then it posts the message.
723  *
724  * IN:
725  * q            - ptr to user MQ.
726  * wr           - ptr to host-copy of the WR.
727  * qp           - ptr to user qp
728  * size         - Number of bytes to post.  Assumed to be divisible by 4.
729  *
730  * OUT: none
731  *
732  * Return:
733  * CCIL status codes.
734  */
735 static int qp_wr_post(struct c2_mq *q, union c2wr * wr, struct c2_qp *qp, u32 size)
736 {
737         union c2wr *msg;
738
739         msg = c2_mq_alloc(q);
740         if (msg == NULL) {
741                 return -EINVAL;
742         }
743 #ifdef CCMSGMAGIC
744         ((c2wr_hdr_t *) wr)->magic = cpu_to_be32(CCWR_MAGIC);
745 #endif
746
747         /*
748          * Since all header fields in the WR are the same as the
749          * CQE, set the following so the adapter need not.
750          */
751         c2_wr_set_result(wr, CCERR_PENDING);
752
753         /*
754          * Copy the wr down to the adapter
755          */
756         memcpy((void *) msg, (void *) wr, size);
757
758         c2_mq_produce(q);
759         return 0;
760 }
761
762
763 int c2_post_send(struct ib_qp *ibqp, struct ib_send_wr *ib_wr,
764                  struct ib_send_wr **bad_wr)
765 {
766         struct c2_dev *c2dev = to_c2dev(ibqp->device);
767         struct c2_qp *qp = to_c2qp(ibqp);
768         union c2wr wr;
769         int err = 0;
770
771         u32 flags;
772         u32 tot_len;
773         u8 actual_sge_count;
774         u32 msg_size;
775
776         if (qp->state > IB_QPS_RTS)
777                 return -EINVAL;
778
779         while (ib_wr) {
780
781                 flags = 0;
782                 wr.sqwr.sq_hdr.user_hdr.hdr.context = ib_wr->wr_id;
783                 if (ib_wr->send_flags & IB_SEND_SIGNALED) {
784                         flags |= SQ_SIGNALED;
785                 }
786
787                 switch (ib_wr->opcode) {
788                 case IB_WR_SEND:
789                         if (ib_wr->send_flags & IB_SEND_SOLICITED) {
790                                 c2_wr_set_id(&wr, C2_WR_TYPE_SEND_SE);
791                                 msg_size = sizeof(struct c2wr_send_req);
792                         } else {
793                                 c2_wr_set_id(&wr, C2_WR_TYPE_SEND);
794                                 msg_size = sizeof(struct c2wr_send_req);
795                         }
796
797                         wr.sqwr.send.remote_stag = 0;
798                         msg_size += sizeof(struct c2_data_addr) * ib_wr->num_sge;
799                         if (ib_wr->num_sge > qp->send_sgl_depth) {
800                                 err = -EINVAL;
801                                 break;
802                         }
803                         if (ib_wr->send_flags & IB_SEND_FENCE) {
804                                 flags |= SQ_READ_FENCE;
805                         }
806                         err = move_sgl((struct c2_data_addr *) & (wr.sqwr.send.data),
807                                        ib_wr->sg_list,
808                                        ib_wr->num_sge,
809                                        &tot_len, &actual_sge_count);
810                         wr.sqwr.send.sge_len = cpu_to_be32(tot_len);
811                         c2_wr_set_sge_count(&wr, actual_sge_count);
812                         break;
813                 case IB_WR_RDMA_WRITE:
814                         c2_wr_set_id(&wr, C2_WR_TYPE_RDMA_WRITE);
815                         msg_size = sizeof(struct c2wr_rdma_write_req) +
816                             (sizeof(struct c2_data_addr) * ib_wr->num_sge);
817                         if (ib_wr->num_sge > qp->rdma_write_sgl_depth) {
818                                 err = -EINVAL;
819                                 break;
820                         }
821                         if (ib_wr->send_flags & IB_SEND_FENCE) {
822                                 flags |= SQ_READ_FENCE;
823                         }
824                         wr.sqwr.rdma_write.remote_stag =
825                             cpu_to_be32(ib_wr->wr.rdma.rkey);
826                         wr.sqwr.rdma_write.remote_to =
827                             cpu_to_be64(ib_wr->wr.rdma.remote_addr);
828                         err = move_sgl((struct c2_data_addr *)
829                                        & (wr.sqwr.rdma_write.data),
830                                        ib_wr->sg_list,
831                                        ib_wr->num_sge,
832                                        &tot_len, &actual_sge_count);
833                         wr.sqwr.rdma_write.sge_len = cpu_to_be32(tot_len);
834                         c2_wr_set_sge_count(&wr, actual_sge_count);
835                         break;
836                 case IB_WR_RDMA_READ:
837                         c2_wr_set_id(&wr, C2_WR_TYPE_RDMA_READ);
838                         msg_size = sizeof(struct c2wr_rdma_read_req);
839
840                         /* IWarp only suppots 1 sge for RDMA reads */
841                         if (ib_wr->num_sge > 1) {
842                                 err = -EINVAL;
843                                 break;
844                         }
845
846                         /*
847                          * Move the local and remote stag/to/len into the WR.
848                          */
849                         wr.sqwr.rdma_read.local_stag =
850                             cpu_to_be32(ib_wr->sg_list->lkey);
851                         wr.sqwr.rdma_read.local_to =
852                             cpu_to_be64(ib_wr->sg_list->addr);
853                         wr.sqwr.rdma_read.remote_stag =
854                             cpu_to_be32(ib_wr->wr.rdma.rkey);
855                         wr.sqwr.rdma_read.remote_to =
856                             cpu_to_be64(ib_wr->wr.rdma.remote_addr);
857                         wr.sqwr.rdma_read.length =
858                             cpu_to_be32(ib_wr->sg_list->length);
859                         break;
860                 default:
861                         /* error */
862                         msg_size = 0;
863                         err = -EINVAL;
864                         break;
865                 }
866
867                 /*
868                  * If we had an error on the last wr build, then
869                  * break out.  Possible errors include bogus WR
870                  * type, and a bogus SGL length...
871                  */
872                 if (err) {
873                         break;
874                 }
875
876                 /*
877                  * Store flags
878                  */
879                 c2_wr_set_flags(&wr, flags);
880
881                 /*
882                  * Post the puppy!
883                  */
884                 err = qp_wr_post(&qp->sq_mq, &wr, qp, msg_size);
885                 if (err) {
886                         break;
887                 }
888
889                 /*
890                  * Enqueue mq index to activity FIFO.
891                  */
892                 c2_activity(c2dev, qp->sq_mq.index, qp->sq_mq.hint_count);
893
894                 ib_wr = ib_wr->next;
895         }
896
897         if (err)
898                 *bad_wr = ib_wr;
899         return err;
900 }
901
902 int c2_post_receive(struct ib_qp *ibqp, struct ib_recv_wr *ib_wr,
903                     struct ib_recv_wr **bad_wr)
904 {
905         struct c2_dev *c2dev = to_c2dev(ibqp->device);
906         struct c2_qp *qp = to_c2qp(ibqp);
907         union c2wr wr;
908         int err = 0;
909
910         if (qp->state > IB_QPS_RTS)
911                 return -EINVAL;
912
913         /*
914          * Try and post each work request
915          */
916         while (ib_wr) {
917                 u32 tot_len;
918                 u8 actual_sge_count;
919
920                 if (ib_wr->num_sge > qp->recv_sgl_depth) {
921                         err = -EINVAL;
922                         break;
923                 }
924
925                 /*
926                  * Create local host-copy of the WR
927                  */
928                 wr.rqwr.rq_hdr.user_hdr.hdr.context = ib_wr->wr_id;
929                 c2_wr_set_id(&wr, CCWR_RECV);
930                 c2_wr_set_flags(&wr, 0);
931
932                 /* sge_count is limited to eight bits. */
933                 BUG_ON(ib_wr->num_sge >= 256);
934                 err = move_sgl((struct c2_data_addr *) & (wr.rqwr.data),
935                                ib_wr->sg_list,
936                                ib_wr->num_sge, &tot_len, &actual_sge_count);
937                 c2_wr_set_sge_count(&wr, actual_sge_count);
938
939                 /*
940                  * If we had an error on the last wr build, then
941                  * break out.  Possible errors include bogus WR
942                  * type, and a bogus SGL length...
943                  */
944                 if (err) {
945                         break;
946                 }
947
948                 err = qp_wr_post(&qp->rq_mq, &wr, qp, qp->rq_mq.msg_size);
949                 if (err) {
950                         break;
951                 }
952
953                 /*
954                  * Enqueue mq index to activity FIFO
955                  */
956                 c2_activity(c2dev, qp->rq_mq.index, qp->rq_mq.hint_count);
957
958                 ib_wr = ib_wr->next;
959         }
960
961         if (err)
962                 *bad_wr = ib_wr;
963         return err;
964 }
965
966 void __devinit c2_init_qp_table(struct c2_dev *c2dev)
967 {
968         spin_lock_init(&c2dev->qp_table.lock);
969         idr_init(&c2dev->qp_table.idr);
970 }
971
972 void __devexit c2_cleanup_qp_table(struct c2_dev *c2dev)
973 {
974         idr_destroy(&c2dev->qp_table.idr);
975 }