Manual merge with Linus.
[pandora-kernel.git] / drivers / infiniband / core / mad.c
1 /*
2  * Copyright (c) 2004, 2005 Voltaire, Inc. All rights reserved.
3  * Copyright (c) 2005 Intel Corporation.  All rights reserved.
4  * Copyright (c) 2005 Mellanox Technologies Ltd.  All rights reserved.
5  *
6  * This software is available to you under a choice of one of two
7  * licenses.  You may choose to be licensed under the terms of the GNU
8  * General Public License (GPL) Version 2, available from the file
9  * COPYING in the main directory of this source tree, or the
10  * OpenIB.org BSD license below:
11  *
12  *     Redistribution and use in source and binary forms, with or
13  *     without modification, are permitted provided that the following
14  *     conditions are met:
15  *
16  *      - Redistributions of source code must retain the above
17  *        copyright notice, this list of conditions and the following
18  *        disclaimer.
19  *
20  *      - Redistributions in binary form must reproduce the above
21  *        copyright notice, this list of conditions and the following
22  *        disclaimer in the documentation and/or other materials
23  *        provided with the distribution.
24  *
25  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
26  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
27  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
28  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
29  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
30  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
31  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
32  * SOFTWARE.
33  *
34  * $Id: mad.c 5596 2006-03-03 01:00:07Z sean.hefty $
35  */
36 #include <linux/dma-mapping.h>
37
38 #include "mad_priv.h"
39 #include "mad_rmpp.h"
40 #include "smi.h"
41 #include "agent.h"
42
43 MODULE_LICENSE("Dual BSD/GPL");
44 MODULE_DESCRIPTION("kernel IB MAD API");
45 MODULE_AUTHOR("Hal Rosenstock");
46 MODULE_AUTHOR("Sean Hefty");
47
48
49 kmem_cache_t *ib_mad_cache;
50
51 static struct list_head ib_mad_port_list;
52 static u32 ib_mad_client_id = 0;
53
54 /* Port list lock */
55 static spinlock_t ib_mad_port_list_lock;
56
57
58 /* Forward declarations */
59 static int method_in_use(struct ib_mad_mgmt_method_table **method,
60                          struct ib_mad_reg_req *mad_reg_req);
61 static void remove_mad_reg_req(struct ib_mad_agent_private *priv);
62 static struct ib_mad_agent_private *find_mad_agent(
63                                         struct ib_mad_port_private *port_priv,
64                                         struct ib_mad *mad);
65 static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
66                                     struct ib_mad_private *mad);
67 static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv);
68 static void timeout_sends(void *data);
69 static void local_completions(void *data);
70 static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
71                               struct ib_mad_agent_private *agent_priv,
72                               u8 mgmt_class);
73 static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
74                            struct ib_mad_agent_private *agent_priv);
75
76 /*
77  * Returns a ib_mad_port_private structure or NULL for a device/port
78  * Assumes ib_mad_port_list_lock is being held
79  */
80 static inline struct ib_mad_port_private *
81 __ib_get_mad_port(struct ib_device *device, int port_num)
82 {
83         struct ib_mad_port_private *entry;
84
85         list_for_each_entry(entry, &ib_mad_port_list, port_list) {
86                 if (entry->device == device && entry->port_num == port_num)
87                         return entry;
88         }
89         return NULL;
90 }
91
92 /*
93  * Wrapper function to return a ib_mad_port_private structure or NULL
94  * for a device/port
95  */
96 static inline struct ib_mad_port_private *
97 ib_get_mad_port(struct ib_device *device, int port_num)
98 {
99         struct ib_mad_port_private *entry;
100         unsigned long flags;
101
102         spin_lock_irqsave(&ib_mad_port_list_lock, flags);
103         entry = __ib_get_mad_port(device, port_num);
104         spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
105
106         return entry;
107 }
108
109 static inline u8 convert_mgmt_class(u8 mgmt_class)
110 {
111         /* Alias IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE to 0 */
112         return mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE ?
113                 0 : mgmt_class;
114 }
115
116 static int get_spl_qp_index(enum ib_qp_type qp_type)
117 {
118         switch (qp_type)
119         {
120         case IB_QPT_SMI:
121                 return 0;
122         case IB_QPT_GSI:
123                 return 1;
124         default:
125                 return -1;
126         }
127 }
128
129 static int vendor_class_index(u8 mgmt_class)
130 {
131         return mgmt_class - IB_MGMT_CLASS_VENDOR_RANGE2_START;
132 }
133
134 static int is_vendor_class(u8 mgmt_class)
135 {
136         if ((mgmt_class < IB_MGMT_CLASS_VENDOR_RANGE2_START) ||
137             (mgmt_class > IB_MGMT_CLASS_VENDOR_RANGE2_END))
138                 return 0;
139         return 1;
140 }
141
142 static int is_vendor_oui(char *oui)
143 {
144         if (oui[0] || oui[1] || oui[2])
145                 return 1;
146         return 0;
147 }
148
149 static int is_vendor_method_in_use(
150                 struct ib_mad_mgmt_vendor_class *vendor_class,
151                 struct ib_mad_reg_req *mad_reg_req)
152 {
153         struct ib_mad_mgmt_method_table *method;
154         int i;
155
156         for (i = 0; i < MAX_MGMT_OUI; i++) {
157                 if (!memcmp(vendor_class->oui[i], mad_reg_req->oui, 3)) {
158                         method = vendor_class->method_table[i];
159                         if (method) {
160                                 if (method_in_use(&method, mad_reg_req))
161                                         return 1;
162                                 else
163                                         break;
164                         }
165                 }
166         }
167         return 0;
168 }
169
170 /*
171  * ib_register_mad_agent - Register to send/receive MADs
172  */
173 struct ib_mad_agent *ib_register_mad_agent(struct ib_device *device,
174                                            u8 port_num,
175                                            enum ib_qp_type qp_type,
176                                            struct ib_mad_reg_req *mad_reg_req,
177                                            u8 rmpp_version,
178                                            ib_mad_send_handler send_handler,
179                                            ib_mad_recv_handler recv_handler,
180                                            void *context)
181 {
182         struct ib_mad_port_private *port_priv;
183         struct ib_mad_agent *ret = ERR_PTR(-EINVAL);
184         struct ib_mad_agent_private *mad_agent_priv;
185         struct ib_mad_reg_req *reg_req = NULL;
186         struct ib_mad_mgmt_class_table *class;
187         struct ib_mad_mgmt_vendor_class_table *vendor;
188         struct ib_mad_mgmt_vendor_class *vendor_class;
189         struct ib_mad_mgmt_method_table *method;
190         int ret2, qpn;
191         unsigned long flags;
192         u8 mgmt_class, vclass;
193
194         /* Validate parameters */
195         qpn = get_spl_qp_index(qp_type);
196         if (qpn == -1)
197                 goto error1;
198
199         if (rmpp_version && rmpp_version != IB_MGMT_RMPP_VERSION)
200                 goto error1;
201
202         /* Validate MAD registration request if supplied */
203         if (mad_reg_req) {
204                 if (mad_reg_req->mgmt_class_version >= MAX_MGMT_VERSION)
205                         goto error1;
206                 if (!recv_handler)
207                         goto error1;
208                 if (mad_reg_req->mgmt_class >= MAX_MGMT_CLASS) {
209                         /*
210                          * IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE is the only
211                          * one in this range currently allowed
212                          */
213                         if (mad_reg_req->mgmt_class !=
214                             IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)
215                                 goto error1;
216                 } else if (mad_reg_req->mgmt_class == 0) {
217                         /*
218                          * Class 0 is reserved in IBA and is used for
219                          * aliasing of IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE
220                          */
221                         goto error1;
222                 } else if (is_vendor_class(mad_reg_req->mgmt_class)) {
223                         /*
224                          * If class is in "new" vendor range,
225                          * ensure supplied OUI is not zero
226                          */
227                         if (!is_vendor_oui(mad_reg_req->oui))
228                                 goto error1;
229                 }
230                 /* Make sure class supplied is consistent with RMPP */
231                 if (ib_is_mad_class_rmpp(mad_reg_req->mgmt_class)) {
232                         if (!rmpp_version)
233                                 goto error1;
234                 } else {
235                         if (rmpp_version)
236                                 goto error1;
237                 }
238                 /* Make sure class supplied is consistent with QP type */
239                 if (qp_type == IB_QPT_SMI) {
240                         if ((mad_reg_req->mgmt_class !=
241                                         IB_MGMT_CLASS_SUBN_LID_ROUTED) &&
242                             (mad_reg_req->mgmt_class !=
243                                         IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE))
244                                 goto error1;
245                 } else {
246                         if ((mad_reg_req->mgmt_class ==
247                                         IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
248                             (mad_reg_req->mgmt_class ==
249                                         IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE))
250                                 goto error1;
251                 }
252         } else {
253                 /* No registration request supplied */
254                 if (!send_handler)
255                         goto error1;
256         }
257
258         /* Validate device and port */
259         port_priv = ib_get_mad_port(device, port_num);
260         if (!port_priv) {
261                 ret = ERR_PTR(-ENODEV);
262                 goto error1;
263         }
264
265         /* Allocate structures */
266         mad_agent_priv = kzalloc(sizeof *mad_agent_priv, GFP_KERNEL);
267         if (!mad_agent_priv) {
268                 ret = ERR_PTR(-ENOMEM);
269                 goto error1;
270         }
271
272         mad_agent_priv->agent.mr = ib_get_dma_mr(port_priv->qp_info[qpn].qp->pd,
273                                                  IB_ACCESS_LOCAL_WRITE);
274         if (IS_ERR(mad_agent_priv->agent.mr)) {
275                 ret = ERR_PTR(-ENOMEM);
276                 goto error2;
277         }
278
279         if (mad_reg_req) {
280                 reg_req = kmalloc(sizeof *reg_req, GFP_KERNEL);
281                 if (!reg_req) {
282                         ret = ERR_PTR(-ENOMEM);
283                         goto error3;
284                 }
285                 /* Make a copy of the MAD registration request */
286                 memcpy(reg_req, mad_reg_req, sizeof *reg_req);
287         }
288
289         /* Now, fill in the various structures */
290         mad_agent_priv->qp_info = &port_priv->qp_info[qpn];
291         mad_agent_priv->reg_req = reg_req;
292         mad_agent_priv->agent.rmpp_version = rmpp_version;
293         mad_agent_priv->agent.device = device;
294         mad_agent_priv->agent.recv_handler = recv_handler;
295         mad_agent_priv->agent.send_handler = send_handler;
296         mad_agent_priv->agent.context = context;
297         mad_agent_priv->agent.qp = port_priv->qp_info[qpn].qp;
298         mad_agent_priv->agent.port_num = port_num;
299
300         spin_lock_irqsave(&port_priv->reg_lock, flags);
301         mad_agent_priv->agent.hi_tid = ++ib_mad_client_id;
302
303         /*
304          * Make sure MAD registration (if supplied)
305          * is non overlapping with any existing ones
306          */
307         if (mad_reg_req) {
308                 mgmt_class = convert_mgmt_class(mad_reg_req->mgmt_class);
309                 if (!is_vendor_class(mgmt_class)) {
310                         class = port_priv->version[mad_reg_req->
311                                                    mgmt_class_version].class;
312                         if (class) {
313                                 method = class->method_table[mgmt_class];
314                                 if (method) {
315                                         if (method_in_use(&method,
316                                                            mad_reg_req))
317                                                 goto error4;
318                                 }
319                         }
320                         ret2 = add_nonoui_reg_req(mad_reg_req, mad_agent_priv,
321                                                   mgmt_class);
322                 } else {
323                         /* "New" vendor class range */
324                         vendor = port_priv->version[mad_reg_req->
325                                                     mgmt_class_version].vendor;
326                         if (vendor) {
327                                 vclass = vendor_class_index(mgmt_class);
328                                 vendor_class = vendor->vendor_class[vclass];
329                                 if (vendor_class) {
330                                         if (is_vendor_method_in_use(
331                                                         vendor_class,
332                                                         mad_reg_req))
333                                                 goto error4;
334                                 }
335                         }
336                         ret2 = add_oui_reg_req(mad_reg_req, mad_agent_priv);
337                 }
338                 if (ret2) {
339                         ret = ERR_PTR(ret2);
340                         goto error4;
341                 }
342         }
343
344         /* Add mad agent into port's agent list */
345         list_add_tail(&mad_agent_priv->agent_list, &port_priv->agent_list);
346         spin_unlock_irqrestore(&port_priv->reg_lock, flags);
347
348         spin_lock_init(&mad_agent_priv->lock);
349         INIT_LIST_HEAD(&mad_agent_priv->send_list);
350         INIT_LIST_HEAD(&mad_agent_priv->wait_list);
351         INIT_LIST_HEAD(&mad_agent_priv->done_list);
352         INIT_LIST_HEAD(&mad_agent_priv->rmpp_list);
353         INIT_WORK(&mad_agent_priv->timed_work, timeout_sends, mad_agent_priv);
354         INIT_LIST_HEAD(&mad_agent_priv->local_list);
355         INIT_WORK(&mad_agent_priv->local_work, local_completions,
356                    mad_agent_priv);
357         atomic_set(&mad_agent_priv->refcount, 1);
358         init_waitqueue_head(&mad_agent_priv->wait);
359
360         return &mad_agent_priv->agent;
361
362 error4:
363         spin_unlock_irqrestore(&port_priv->reg_lock, flags);
364         kfree(reg_req);
365 error3:
366         ib_dereg_mr(mad_agent_priv->agent.mr);
367 error2:
368         kfree(mad_agent_priv);
369 error1:
370         return ret;
371 }
372 EXPORT_SYMBOL(ib_register_mad_agent);
373
374 static inline int is_snooping_sends(int mad_snoop_flags)
375 {
376         return (mad_snoop_flags &
377                 (/*IB_MAD_SNOOP_POSTED_SENDS |
378                  IB_MAD_SNOOP_RMPP_SENDS |*/
379                  IB_MAD_SNOOP_SEND_COMPLETIONS /*|
380                  IB_MAD_SNOOP_RMPP_SEND_COMPLETIONS*/));
381 }
382
383 static inline int is_snooping_recvs(int mad_snoop_flags)
384 {
385         return (mad_snoop_flags &
386                 (IB_MAD_SNOOP_RECVS /*|
387                  IB_MAD_SNOOP_RMPP_RECVS*/));
388 }
389
390 static int register_snoop_agent(struct ib_mad_qp_info *qp_info,
391                                 struct ib_mad_snoop_private *mad_snoop_priv)
392 {
393         struct ib_mad_snoop_private **new_snoop_table;
394         unsigned long flags;
395         int i;
396
397         spin_lock_irqsave(&qp_info->snoop_lock, flags);
398         /* Check for empty slot in array. */
399         for (i = 0; i < qp_info->snoop_table_size; i++)
400                 if (!qp_info->snoop_table[i])
401                         break;
402
403         if (i == qp_info->snoop_table_size) {
404                 /* Grow table. */
405                 new_snoop_table = kmalloc(sizeof mad_snoop_priv *
406                                           qp_info->snoop_table_size + 1,
407                                           GFP_ATOMIC);
408                 if (!new_snoop_table) {
409                         i = -ENOMEM;
410                         goto out;
411                 }
412                 if (qp_info->snoop_table) {
413                         memcpy(new_snoop_table, qp_info->snoop_table,
414                                sizeof mad_snoop_priv *
415                                qp_info->snoop_table_size);
416                         kfree(qp_info->snoop_table);
417                 }
418                 qp_info->snoop_table = new_snoop_table;
419                 qp_info->snoop_table_size++;
420         }
421         qp_info->snoop_table[i] = mad_snoop_priv;
422         atomic_inc(&qp_info->snoop_count);
423 out:
424         spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
425         return i;
426 }
427
428 struct ib_mad_agent *ib_register_mad_snoop(struct ib_device *device,
429                                            u8 port_num,
430                                            enum ib_qp_type qp_type,
431                                            int mad_snoop_flags,
432                                            ib_mad_snoop_handler snoop_handler,
433                                            ib_mad_recv_handler recv_handler,
434                                            void *context)
435 {
436         struct ib_mad_port_private *port_priv;
437         struct ib_mad_agent *ret;
438         struct ib_mad_snoop_private *mad_snoop_priv;
439         int qpn;
440
441         /* Validate parameters */
442         if ((is_snooping_sends(mad_snoop_flags) && !snoop_handler) ||
443             (is_snooping_recvs(mad_snoop_flags) && !recv_handler)) {
444                 ret = ERR_PTR(-EINVAL);
445                 goto error1;
446         }
447         qpn = get_spl_qp_index(qp_type);
448         if (qpn == -1) {
449                 ret = ERR_PTR(-EINVAL);
450                 goto error1;
451         }
452         port_priv = ib_get_mad_port(device, port_num);
453         if (!port_priv) {
454                 ret = ERR_PTR(-ENODEV);
455                 goto error1;
456         }
457         /* Allocate structures */
458         mad_snoop_priv = kzalloc(sizeof *mad_snoop_priv, GFP_KERNEL);
459         if (!mad_snoop_priv) {
460                 ret = ERR_PTR(-ENOMEM);
461                 goto error1;
462         }
463
464         /* Now, fill in the various structures */
465         mad_snoop_priv->qp_info = &port_priv->qp_info[qpn];
466         mad_snoop_priv->agent.device = device;
467         mad_snoop_priv->agent.recv_handler = recv_handler;
468         mad_snoop_priv->agent.snoop_handler = snoop_handler;
469         mad_snoop_priv->agent.context = context;
470         mad_snoop_priv->agent.qp = port_priv->qp_info[qpn].qp;
471         mad_snoop_priv->agent.port_num = port_num;
472         mad_snoop_priv->mad_snoop_flags = mad_snoop_flags;
473         init_waitqueue_head(&mad_snoop_priv->wait);
474         mad_snoop_priv->snoop_index = register_snoop_agent(
475                                                 &port_priv->qp_info[qpn],
476                                                 mad_snoop_priv);
477         if (mad_snoop_priv->snoop_index < 0) {
478                 ret = ERR_PTR(mad_snoop_priv->snoop_index);
479                 goto error2;
480         }
481
482         atomic_set(&mad_snoop_priv->refcount, 1);
483         return &mad_snoop_priv->agent;
484
485 error2:
486         kfree(mad_snoop_priv);
487 error1:
488         return ret;
489 }
490 EXPORT_SYMBOL(ib_register_mad_snoop);
491
492 static void unregister_mad_agent(struct ib_mad_agent_private *mad_agent_priv)
493 {
494         struct ib_mad_port_private *port_priv;
495         unsigned long flags;
496
497         /* Note that we could still be handling received MADs */
498
499         /*
500          * Canceling all sends results in dropping received response
501          * MADs, preventing us from queuing additional work
502          */
503         cancel_mads(mad_agent_priv);
504         port_priv = mad_agent_priv->qp_info->port_priv;
505         cancel_delayed_work(&mad_agent_priv->timed_work);
506
507         spin_lock_irqsave(&port_priv->reg_lock, flags);
508         remove_mad_reg_req(mad_agent_priv);
509         list_del(&mad_agent_priv->agent_list);
510         spin_unlock_irqrestore(&port_priv->reg_lock, flags);
511
512         flush_workqueue(port_priv->wq);
513         ib_cancel_rmpp_recvs(mad_agent_priv);
514
515         atomic_dec(&mad_agent_priv->refcount);
516         wait_event(mad_agent_priv->wait,
517                    !atomic_read(&mad_agent_priv->refcount));
518
519         kfree(mad_agent_priv->reg_req);
520         ib_dereg_mr(mad_agent_priv->agent.mr);
521         kfree(mad_agent_priv);
522 }
523
524 static void unregister_mad_snoop(struct ib_mad_snoop_private *mad_snoop_priv)
525 {
526         struct ib_mad_qp_info *qp_info;
527         unsigned long flags;
528
529         qp_info = mad_snoop_priv->qp_info;
530         spin_lock_irqsave(&qp_info->snoop_lock, flags);
531         qp_info->snoop_table[mad_snoop_priv->snoop_index] = NULL;
532         atomic_dec(&qp_info->snoop_count);
533         spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
534
535         atomic_dec(&mad_snoop_priv->refcount);
536         wait_event(mad_snoop_priv->wait,
537                    !atomic_read(&mad_snoop_priv->refcount));
538
539         kfree(mad_snoop_priv);
540 }
541
542 /*
543  * ib_unregister_mad_agent - Unregisters a client from using MAD services
544  */
545 int ib_unregister_mad_agent(struct ib_mad_agent *mad_agent)
546 {
547         struct ib_mad_agent_private *mad_agent_priv;
548         struct ib_mad_snoop_private *mad_snoop_priv;
549
550         /* If the TID is zero, the agent can only snoop. */
551         if (mad_agent->hi_tid) {
552                 mad_agent_priv = container_of(mad_agent,
553                                               struct ib_mad_agent_private,
554                                               agent);
555                 unregister_mad_agent(mad_agent_priv);
556         } else {
557                 mad_snoop_priv = container_of(mad_agent,
558                                               struct ib_mad_snoop_private,
559                                               agent);
560                 unregister_mad_snoop(mad_snoop_priv);
561         }
562         return 0;
563 }
564 EXPORT_SYMBOL(ib_unregister_mad_agent);
565
566 static inline int response_mad(struct ib_mad *mad)
567 {
568         /* Trap represses are responses although response bit is reset */
569         return ((mad->mad_hdr.method == IB_MGMT_METHOD_TRAP_REPRESS) ||
570                 (mad->mad_hdr.method & IB_MGMT_METHOD_RESP));
571 }
572
573 static void dequeue_mad(struct ib_mad_list_head *mad_list)
574 {
575         struct ib_mad_queue *mad_queue;
576         unsigned long flags;
577
578         BUG_ON(!mad_list->mad_queue);
579         mad_queue = mad_list->mad_queue;
580         spin_lock_irqsave(&mad_queue->lock, flags);
581         list_del(&mad_list->list);
582         mad_queue->count--;
583         spin_unlock_irqrestore(&mad_queue->lock, flags);
584 }
585
586 static void snoop_send(struct ib_mad_qp_info *qp_info,
587                        struct ib_mad_send_buf *send_buf,
588                        struct ib_mad_send_wc *mad_send_wc,
589                        int mad_snoop_flags)
590 {
591         struct ib_mad_snoop_private *mad_snoop_priv;
592         unsigned long flags;
593         int i;
594
595         spin_lock_irqsave(&qp_info->snoop_lock, flags);
596         for (i = 0; i < qp_info->snoop_table_size; i++) {
597                 mad_snoop_priv = qp_info->snoop_table[i];
598                 if (!mad_snoop_priv ||
599                     !(mad_snoop_priv->mad_snoop_flags & mad_snoop_flags))
600                         continue;
601
602                 atomic_inc(&mad_snoop_priv->refcount);
603                 spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
604                 mad_snoop_priv->agent.snoop_handler(&mad_snoop_priv->agent,
605                                                     send_buf, mad_send_wc);
606                 if (atomic_dec_and_test(&mad_snoop_priv->refcount))
607                         wake_up(&mad_snoop_priv->wait);
608                 spin_lock_irqsave(&qp_info->snoop_lock, flags);
609         }
610         spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
611 }
612
613 static void snoop_recv(struct ib_mad_qp_info *qp_info,
614                        struct ib_mad_recv_wc *mad_recv_wc,
615                        int mad_snoop_flags)
616 {
617         struct ib_mad_snoop_private *mad_snoop_priv;
618         unsigned long flags;
619         int i;
620
621         spin_lock_irqsave(&qp_info->snoop_lock, flags);
622         for (i = 0; i < qp_info->snoop_table_size; i++) {
623                 mad_snoop_priv = qp_info->snoop_table[i];
624                 if (!mad_snoop_priv ||
625                     !(mad_snoop_priv->mad_snoop_flags & mad_snoop_flags))
626                         continue;
627
628                 atomic_inc(&mad_snoop_priv->refcount);
629                 spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
630                 mad_snoop_priv->agent.recv_handler(&mad_snoop_priv->agent,
631                                                    mad_recv_wc);
632                 if (atomic_dec_and_test(&mad_snoop_priv->refcount))
633                         wake_up(&mad_snoop_priv->wait);
634                 spin_lock_irqsave(&qp_info->snoop_lock, flags);
635         }
636         spin_unlock_irqrestore(&qp_info->snoop_lock, flags);
637 }
638
639 static void build_smp_wc(u64 wr_id, u16 slid, u16 pkey_index, u8 port_num,
640                          struct ib_wc *wc)
641 {
642         memset(wc, 0, sizeof *wc);
643         wc->wr_id = wr_id;
644         wc->status = IB_WC_SUCCESS;
645         wc->opcode = IB_WC_RECV;
646         wc->pkey_index = pkey_index;
647         wc->byte_len = sizeof(struct ib_mad) + sizeof(struct ib_grh);
648         wc->src_qp = IB_QP0;
649         wc->qp_num = IB_QP0;
650         wc->slid = slid;
651         wc->sl = 0;
652         wc->dlid_path_bits = 0;
653         wc->port_num = port_num;
654 }
655
656 /*
657  * Return 0 if SMP is to be sent
658  * Return 1 if SMP was consumed locally (whether or not solicited)
659  * Return < 0 if error
660  */
661 static int handle_outgoing_dr_smp(struct ib_mad_agent_private *mad_agent_priv,
662                                   struct ib_mad_send_wr_private *mad_send_wr)
663 {
664         int ret;
665         struct ib_smp *smp = mad_send_wr->send_buf.mad;
666         unsigned long flags;
667         struct ib_mad_local_private *local;
668         struct ib_mad_private *mad_priv;
669         struct ib_mad_port_private *port_priv;
670         struct ib_mad_agent_private *recv_mad_agent = NULL;
671         struct ib_device *device = mad_agent_priv->agent.device;
672         u8 port_num = mad_agent_priv->agent.port_num;
673         struct ib_wc mad_wc;
674         struct ib_send_wr *send_wr = &mad_send_wr->send_wr;
675
676         /*
677          * Directed route handling starts if the initial LID routed part of
678          * a request or the ending LID routed part of a response is empty.
679          * If we are at the start of the LID routed part, don't update the
680          * hop_ptr or hop_cnt.  See section 14.2.2, Vol 1 IB spec.
681          */
682         if ((ib_get_smp_direction(smp) ? smp->dr_dlid : smp->dr_slid) ==
683              IB_LID_PERMISSIVE &&
684             !smi_handle_dr_smp_send(smp, device->node_type, port_num)) {
685                 ret = -EINVAL;
686                 printk(KERN_ERR PFX "Invalid directed route\n");
687                 goto out;
688         }
689         /* Check to post send on QP or process locally */
690         ret = smi_check_local_smp(smp, device);
691         if (!ret)
692                 goto out;
693
694         local = kmalloc(sizeof *local, GFP_ATOMIC);
695         if (!local) {
696                 ret = -ENOMEM;
697                 printk(KERN_ERR PFX "No memory for ib_mad_local_private\n");
698                 goto out;
699         }
700         local->mad_priv = NULL;
701         local->recv_mad_agent = NULL;
702         mad_priv = kmem_cache_alloc(ib_mad_cache, GFP_ATOMIC);
703         if (!mad_priv) {
704                 ret = -ENOMEM;
705                 printk(KERN_ERR PFX "No memory for local response MAD\n");
706                 kfree(local);
707                 goto out;
708         }
709
710         build_smp_wc(send_wr->wr_id, be16_to_cpu(smp->dr_slid),
711                      send_wr->wr.ud.pkey_index,
712                      send_wr->wr.ud.port_num, &mad_wc);
713
714         /* No GRH for DR SMP */
715         ret = device->process_mad(device, 0, port_num, &mad_wc, NULL,
716                                   (struct ib_mad *)smp,
717                                   (struct ib_mad *)&mad_priv->mad);
718         switch (ret)
719         {
720         case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_REPLY:
721                 if (response_mad(&mad_priv->mad.mad) &&
722                     mad_agent_priv->agent.recv_handler) {
723                         local->mad_priv = mad_priv;
724                         local->recv_mad_agent = mad_agent_priv;
725                         /*
726                          * Reference MAD agent until receive
727                          * side of local completion handled
728                          */
729                         atomic_inc(&mad_agent_priv->refcount);
730                 } else
731                         kmem_cache_free(ib_mad_cache, mad_priv);
732                 break;
733         case IB_MAD_RESULT_SUCCESS | IB_MAD_RESULT_CONSUMED:
734                 kmem_cache_free(ib_mad_cache, mad_priv);
735                 break;
736         case IB_MAD_RESULT_SUCCESS:
737                 /* Treat like an incoming receive MAD */
738                 port_priv = ib_get_mad_port(mad_agent_priv->agent.device,
739                                             mad_agent_priv->agent.port_num);
740                 if (port_priv) {
741                         mad_priv->mad.mad.mad_hdr.tid =
742                                 ((struct ib_mad *)smp)->mad_hdr.tid;
743                         recv_mad_agent = find_mad_agent(port_priv,
744                                                         &mad_priv->mad.mad);
745                 }
746                 if (!port_priv || !recv_mad_agent) {
747                         kmem_cache_free(ib_mad_cache, mad_priv);
748                         kfree(local);
749                         ret = 0;
750                         goto out;
751                 }
752                 local->mad_priv = mad_priv;
753                 local->recv_mad_agent = recv_mad_agent;
754                 break;
755         default:
756                 kmem_cache_free(ib_mad_cache, mad_priv);
757                 kfree(local);
758                 ret = -EINVAL;
759                 goto out;
760         }
761
762         local->mad_send_wr = mad_send_wr;
763         /* Reference MAD agent until send side of local completion handled */
764         atomic_inc(&mad_agent_priv->refcount);
765         /* Queue local completion to local list */
766         spin_lock_irqsave(&mad_agent_priv->lock, flags);
767         list_add_tail(&local->completion_list, &mad_agent_priv->local_list);
768         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
769         queue_work(mad_agent_priv->qp_info->port_priv->wq,
770                    &mad_agent_priv->local_work);
771         ret = 1;
772 out:
773         return ret;
774 }
775
776 static int get_pad_size(int hdr_len, int data_len)
777 {
778         int seg_size, pad;
779
780         seg_size = sizeof(struct ib_mad) - hdr_len;
781         if (data_len && seg_size) {
782                 pad = seg_size - data_len % seg_size;
783                 return pad == seg_size ? 0 : pad;
784         } else
785                 return seg_size;
786 }
787
788 static void free_send_rmpp_list(struct ib_mad_send_wr_private *mad_send_wr)
789 {
790         struct ib_rmpp_segment *s, *t;
791
792         list_for_each_entry_safe(s, t, &mad_send_wr->rmpp_list, list) {
793                 list_del(&s->list);
794                 kfree(s);
795         }
796 }
797
798 static int alloc_send_rmpp_list(struct ib_mad_send_wr_private *send_wr,
799                                 gfp_t gfp_mask)
800 {
801         struct ib_mad_send_buf *send_buf = &send_wr->send_buf;
802         struct ib_rmpp_mad *rmpp_mad = send_buf->mad;
803         struct ib_rmpp_segment *seg = NULL;
804         int left, seg_size, pad;
805
806         send_buf->seg_size = sizeof (struct ib_mad) - send_buf->hdr_len;
807         seg_size = send_buf->seg_size;
808         pad = send_wr->pad;
809
810         /* Allocate data segments. */
811         for (left = send_buf->data_len + pad; left > 0; left -= seg_size) {
812                 seg = kmalloc(sizeof (*seg) + seg_size, gfp_mask);
813                 if (!seg) {
814                         printk(KERN_ERR "alloc_send_rmpp_segs: RMPP mem "
815                                "alloc failed for len %zd, gfp %#x\n",
816                                sizeof (*seg) + seg_size, gfp_mask);
817                         free_send_rmpp_list(send_wr);
818                         return -ENOMEM;
819                 }
820                 seg->num = ++send_buf->seg_count;
821                 list_add_tail(&seg->list, &send_wr->rmpp_list);
822         }
823
824         /* Zero any padding */
825         if (pad)
826                 memset(seg->data + seg_size - pad, 0, pad);
827
828         rmpp_mad->rmpp_hdr.rmpp_version = send_wr->mad_agent_priv->
829                                           agent.rmpp_version;
830         rmpp_mad->rmpp_hdr.rmpp_type = IB_MGMT_RMPP_TYPE_DATA;
831         ib_set_rmpp_flags(&rmpp_mad->rmpp_hdr, IB_MGMT_RMPP_FLAG_ACTIVE);
832
833         send_wr->cur_seg = container_of(send_wr->rmpp_list.next,
834                                         struct ib_rmpp_segment, list);
835         send_wr->last_ack_seg = send_wr->cur_seg;
836         return 0;
837 }
838
839 struct ib_mad_send_buf * ib_create_send_mad(struct ib_mad_agent *mad_agent,
840                                             u32 remote_qpn, u16 pkey_index,
841                                             int rmpp_active,
842                                             int hdr_len, int data_len,
843                                             gfp_t gfp_mask)
844 {
845         struct ib_mad_agent_private *mad_agent_priv;
846         struct ib_mad_send_wr_private *mad_send_wr;
847         int pad, message_size, ret, size;
848         void *buf;
849
850         mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
851                                       agent);
852         pad = get_pad_size(hdr_len, data_len);
853         message_size = hdr_len + data_len + pad;
854
855         if ((!mad_agent->rmpp_version &&
856              (rmpp_active || message_size > sizeof(struct ib_mad))) ||
857             (!rmpp_active && message_size > sizeof(struct ib_mad)))
858                 return ERR_PTR(-EINVAL);
859
860         size = rmpp_active ? hdr_len : sizeof(struct ib_mad);
861         buf = kzalloc(sizeof *mad_send_wr + size, gfp_mask);
862         if (!buf)
863                 return ERR_PTR(-ENOMEM);
864
865         mad_send_wr = buf + size;
866         INIT_LIST_HEAD(&mad_send_wr->rmpp_list);
867         mad_send_wr->send_buf.mad = buf;
868         mad_send_wr->send_buf.hdr_len = hdr_len;
869         mad_send_wr->send_buf.data_len = data_len;
870         mad_send_wr->pad = pad;
871
872         mad_send_wr->mad_agent_priv = mad_agent_priv;
873         mad_send_wr->sg_list[0].length = hdr_len;
874         mad_send_wr->sg_list[0].lkey = mad_agent->mr->lkey;
875         mad_send_wr->sg_list[1].length = sizeof(struct ib_mad) - hdr_len;
876         mad_send_wr->sg_list[1].lkey = mad_agent->mr->lkey;
877
878         mad_send_wr->send_wr.wr_id = (unsigned long) mad_send_wr;
879         mad_send_wr->send_wr.sg_list = mad_send_wr->sg_list;
880         mad_send_wr->send_wr.num_sge = 2;
881         mad_send_wr->send_wr.opcode = IB_WR_SEND;
882         mad_send_wr->send_wr.send_flags = IB_SEND_SIGNALED;
883         mad_send_wr->send_wr.wr.ud.remote_qpn = remote_qpn;
884         mad_send_wr->send_wr.wr.ud.remote_qkey = IB_QP_SET_QKEY;
885         mad_send_wr->send_wr.wr.ud.pkey_index = pkey_index;
886
887         if (rmpp_active) {
888                 ret = alloc_send_rmpp_list(mad_send_wr, gfp_mask);
889                 if (ret) {
890                         kfree(buf);
891                         return ERR_PTR(ret);
892                 }
893         }
894
895         mad_send_wr->send_buf.mad_agent = mad_agent;
896         atomic_inc(&mad_agent_priv->refcount);
897         return &mad_send_wr->send_buf;
898 }
899 EXPORT_SYMBOL(ib_create_send_mad);
900
901 int ib_get_mad_data_offset(u8 mgmt_class)
902 {
903         if (mgmt_class == IB_MGMT_CLASS_SUBN_ADM)
904                 return IB_MGMT_SA_HDR;
905         else if ((mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
906                  (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
907                  (mgmt_class == IB_MGMT_CLASS_BIS))
908                 return IB_MGMT_DEVICE_HDR;
909         else if ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
910                  (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END))
911                 return IB_MGMT_VENDOR_HDR;
912         else
913                 return IB_MGMT_MAD_HDR;
914 }
915 EXPORT_SYMBOL(ib_get_mad_data_offset);
916
917 int ib_is_mad_class_rmpp(u8 mgmt_class)
918 {
919         if ((mgmt_class == IB_MGMT_CLASS_SUBN_ADM) ||
920             (mgmt_class == IB_MGMT_CLASS_DEVICE_MGMT) ||
921             (mgmt_class == IB_MGMT_CLASS_DEVICE_ADM) ||
922             (mgmt_class == IB_MGMT_CLASS_BIS) ||
923             ((mgmt_class >= IB_MGMT_CLASS_VENDOR_RANGE2_START) &&
924              (mgmt_class <= IB_MGMT_CLASS_VENDOR_RANGE2_END)))
925                 return 1;
926         return 0;
927 }
928 EXPORT_SYMBOL(ib_is_mad_class_rmpp);
929
930 void *ib_get_rmpp_segment(struct ib_mad_send_buf *send_buf, int seg_num)
931 {
932         struct ib_mad_send_wr_private *mad_send_wr;
933         struct list_head *list;
934
935         mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
936                                    send_buf);
937         list = &mad_send_wr->cur_seg->list;
938
939         if (mad_send_wr->cur_seg->num < seg_num) {
940                 list_for_each_entry(mad_send_wr->cur_seg, list, list)
941                         if (mad_send_wr->cur_seg->num == seg_num)
942                                 break;
943         } else if (mad_send_wr->cur_seg->num > seg_num) {
944                 list_for_each_entry_reverse(mad_send_wr->cur_seg, list, list)
945                         if (mad_send_wr->cur_seg->num == seg_num)
946                                 break;
947         }
948         return mad_send_wr->cur_seg->data;
949 }
950 EXPORT_SYMBOL(ib_get_rmpp_segment);
951
952 static inline void *ib_get_payload(struct ib_mad_send_wr_private *mad_send_wr)
953 {
954         if (mad_send_wr->send_buf.seg_count)
955                 return ib_get_rmpp_segment(&mad_send_wr->send_buf,
956                                            mad_send_wr->seg_num);
957         else
958                 return mad_send_wr->send_buf.mad +
959                        mad_send_wr->send_buf.hdr_len;
960 }
961
962 void ib_free_send_mad(struct ib_mad_send_buf *send_buf)
963 {
964         struct ib_mad_agent_private *mad_agent_priv;
965         struct ib_mad_send_wr_private *mad_send_wr;
966
967         mad_agent_priv = container_of(send_buf->mad_agent,
968                                       struct ib_mad_agent_private, agent);
969         mad_send_wr = container_of(send_buf, struct ib_mad_send_wr_private,
970                                    send_buf);
971
972         free_send_rmpp_list(mad_send_wr);
973         kfree(send_buf->mad);
974         if (atomic_dec_and_test(&mad_agent_priv->refcount))
975                 wake_up(&mad_agent_priv->wait);
976 }
977 EXPORT_SYMBOL(ib_free_send_mad);
978
979 int ib_send_mad(struct ib_mad_send_wr_private *mad_send_wr)
980 {
981         struct ib_mad_qp_info *qp_info;
982         struct list_head *list;
983         struct ib_send_wr *bad_send_wr;
984         struct ib_mad_agent *mad_agent;
985         struct ib_sge *sge;
986         unsigned long flags;
987         int ret;
988
989         /* Set WR ID to find mad_send_wr upon completion */
990         qp_info = mad_send_wr->mad_agent_priv->qp_info;
991         mad_send_wr->send_wr.wr_id = (unsigned long)&mad_send_wr->mad_list;
992         mad_send_wr->mad_list.mad_queue = &qp_info->send_queue;
993
994         mad_agent = mad_send_wr->send_buf.mad_agent;
995         sge = mad_send_wr->sg_list;
996         sge[0].addr = dma_map_single(mad_agent->device->dma_device,
997                                      mad_send_wr->send_buf.mad,
998                                      sge[0].length,
999                                      DMA_TO_DEVICE);
1000         pci_unmap_addr_set(mad_send_wr, header_mapping, sge[0].addr);
1001
1002         sge[1].addr = dma_map_single(mad_agent->device->dma_device,
1003                                      ib_get_payload(mad_send_wr),
1004                                      sge[1].length,
1005                                      DMA_TO_DEVICE);
1006         pci_unmap_addr_set(mad_send_wr, payload_mapping, sge[1].addr);
1007
1008         spin_lock_irqsave(&qp_info->send_queue.lock, flags);
1009         if (qp_info->send_queue.count < qp_info->send_queue.max_active) {
1010                 ret = ib_post_send(mad_agent->qp, &mad_send_wr->send_wr,
1011                                    &bad_send_wr);
1012                 list = &qp_info->send_queue.list;
1013         } else {
1014                 ret = 0;
1015                 list = &qp_info->overflow_list;
1016         }
1017
1018         if (!ret) {
1019                 qp_info->send_queue.count++;
1020                 list_add_tail(&mad_send_wr->mad_list.list, list);
1021         }
1022         spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
1023         if (ret) {
1024                 dma_unmap_single(mad_agent->device->dma_device,
1025                                  pci_unmap_addr(mad_send_wr, header_mapping),
1026                                  sge[0].length, DMA_TO_DEVICE);
1027                 dma_unmap_single(mad_agent->device->dma_device,
1028                                  pci_unmap_addr(mad_send_wr, payload_mapping),
1029                                  sge[1].length, DMA_TO_DEVICE);
1030         }
1031         return ret;
1032 }
1033
1034 /*
1035  * ib_post_send_mad - Posts MAD(s) to the send queue of the QP associated
1036  *  with the registered client
1037  */
1038 int ib_post_send_mad(struct ib_mad_send_buf *send_buf,
1039                      struct ib_mad_send_buf **bad_send_buf)
1040 {
1041         struct ib_mad_agent_private *mad_agent_priv;
1042         struct ib_mad_send_buf *next_send_buf;
1043         struct ib_mad_send_wr_private *mad_send_wr;
1044         unsigned long flags;
1045         int ret = -EINVAL;
1046
1047         /* Walk list of send WRs and post each on send list */
1048         for (; send_buf; send_buf = next_send_buf) {
1049
1050                 mad_send_wr = container_of(send_buf,
1051                                            struct ib_mad_send_wr_private,
1052                                            send_buf);
1053                 mad_agent_priv = mad_send_wr->mad_agent_priv;
1054
1055                 if (!send_buf->mad_agent->send_handler ||
1056                     (send_buf->timeout_ms &&
1057                      !send_buf->mad_agent->recv_handler)) {
1058                         ret = -EINVAL;
1059                         goto error;
1060                 }
1061
1062                 if (!ib_is_mad_class_rmpp(((struct ib_mad_hdr *) send_buf->mad)->mgmt_class)) {
1063                         if (mad_agent_priv->agent.rmpp_version) {
1064                                 ret = -EINVAL;
1065                                 goto error;
1066                         }
1067                 }
1068
1069                 /*
1070                  * Save pointer to next work request to post in case the
1071                  * current one completes, and the user modifies the work
1072                  * request associated with the completion
1073                  */
1074                 next_send_buf = send_buf->next;
1075                 mad_send_wr->send_wr.wr.ud.ah = send_buf->ah;
1076
1077                 if (((struct ib_mad_hdr *) send_buf->mad)->mgmt_class ==
1078                     IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
1079                         ret = handle_outgoing_dr_smp(mad_agent_priv,
1080                                                      mad_send_wr);
1081                         if (ret < 0)            /* error */
1082                                 goto error;
1083                         else if (ret == 1)      /* locally consumed */
1084                                 continue;
1085                 }
1086
1087                 mad_send_wr->tid = ((struct ib_mad_hdr *) send_buf->mad)->tid;
1088                 /* Timeout will be updated after send completes */
1089                 mad_send_wr->timeout = msecs_to_jiffies(send_buf->timeout_ms);
1090                 mad_send_wr->retries = send_buf->retries;
1091                 /* Reference for work request to QP + response */
1092                 mad_send_wr->refcount = 1 + (mad_send_wr->timeout > 0);
1093                 mad_send_wr->status = IB_WC_SUCCESS;
1094
1095                 /* Reference MAD agent until send completes */
1096                 atomic_inc(&mad_agent_priv->refcount);
1097                 spin_lock_irqsave(&mad_agent_priv->lock, flags);
1098                 list_add_tail(&mad_send_wr->agent_list,
1099                               &mad_agent_priv->send_list);
1100                 spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1101
1102                 if (mad_agent_priv->agent.rmpp_version) {
1103                         ret = ib_send_rmpp_mad(mad_send_wr);
1104                         if (ret >= 0 && ret != IB_RMPP_RESULT_CONSUMED)
1105                                 ret = ib_send_mad(mad_send_wr);
1106                 } else
1107                         ret = ib_send_mad(mad_send_wr);
1108                 if (ret < 0) {
1109                         /* Fail send request */
1110                         spin_lock_irqsave(&mad_agent_priv->lock, flags);
1111                         list_del(&mad_send_wr->agent_list);
1112                         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1113                         atomic_dec(&mad_agent_priv->refcount);
1114                         goto error;
1115                 }
1116         }
1117         return 0;
1118 error:
1119         if (bad_send_buf)
1120                 *bad_send_buf = send_buf;
1121         return ret;
1122 }
1123 EXPORT_SYMBOL(ib_post_send_mad);
1124
1125 /*
1126  * ib_free_recv_mad - Returns data buffers used to receive
1127  *  a MAD to the access layer
1128  */
1129 void ib_free_recv_mad(struct ib_mad_recv_wc *mad_recv_wc)
1130 {
1131         struct ib_mad_recv_buf *mad_recv_buf, *temp_recv_buf;
1132         struct ib_mad_private_header *mad_priv_hdr;
1133         struct ib_mad_private *priv;
1134         struct list_head free_list;
1135
1136         INIT_LIST_HEAD(&free_list);
1137         list_splice_init(&mad_recv_wc->rmpp_list, &free_list);
1138
1139         list_for_each_entry_safe(mad_recv_buf, temp_recv_buf,
1140                                         &free_list, list) {
1141                 mad_recv_wc = container_of(mad_recv_buf, struct ib_mad_recv_wc,
1142                                            recv_buf);
1143                 mad_priv_hdr = container_of(mad_recv_wc,
1144                                             struct ib_mad_private_header,
1145                                             recv_wc);
1146                 priv = container_of(mad_priv_hdr, struct ib_mad_private,
1147                                     header);
1148                 kmem_cache_free(ib_mad_cache, priv);
1149         }
1150 }
1151 EXPORT_SYMBOL(ib_free_recv_mad);
1152
1153 struct ib_mad_agent *ib_redirect_mad_qp(struct ib_qp *qp,
1154                                         u8 rmpp_version,
1155                                         ib_mad_send_handler send_handler,
1156                                         ib_mad_recv_handler recv_handler,
1157                                         void *context)
1158 {
1159         return ERR_PTR(-EINVAL);        /* XXX: for now */
1160 }
1161 EXPORT_SYMBOL(ib_redirect_mad_qp);
1162
1163 int ib_process_mad_wc(struct ib_mad_agent *mad_agent,
1164                       struct ib_wc *wc)
1165 {
1166         printk(KERN_ERR PFX "ib_process_mad_wc() not implemented yet\n");
1167         return 0;
1168 }
1169 EXPORT_SYMBOL(ib_process_mad_wc);
1170
1171 static int method_in_use(struct ib_mad_mgmt_method_table **method,
1172                          struct ib_mad_reg_req *mad_reg_req)
1173 {
1174         int i;
1175
1176         for (i = find_first_bit(mad_reg_req->method_mask, IB_MGMT_MAX_METHODS);
1177              i < IB_MGMT_MAX_METHODS;
1178              i = find_next_bit(mad_reg_req->method_mask, IB_MGMT_MAX_METHODS,
1179                                1+i)) {
1180                 if ((*method)->agent[i]) {
1181                         printk(KERN_ERR PFX "Method %d already in use\n", i);
1182                         return -EINVAL;
1183                 }
1184         }
1185         return 0;
1186 }
1187
1188 static int allocate_method_table(struct ib_mad_mgmt_method_table **method)
1189 {
1190         /* Allocate management method table */
1191         *method = kzalloc(sizeof **method, GFP_ATOMIC);
1192         if (!*method) {
1193                 printk(KERN_ERR PFX "No memory for "
1194                        "ib_mad_mgmt_method_table\n");
1195                 return -ENOMEM;
1196         }
1197
1198         return 0;
1199 }
1200
1201 /*
1202  * Check to see if there are any methods still in use
1203  */
1204 static int check_method_table(struct ib_mad_mgmt_method_table *method)
1205 {
1206         int i;
1207
1208         for (i = 0; i < IB_MGMT_MAX_METHODS; i++)
1209                 if (method->agent[i])
1210                         return 1;
1211         return 0;
1212 }
1213
1214 /*
1215  * Check to see if there are any method tables for this class still in use
1216  */
1217 static int check_class_table(struct ib_mad_mgmt_class_table *class)
1218 {
1219         int i;
1220
1221         for (i = 0; i < MAX_MGMT_CLASS; i++)
1222                 if (class->method_table[i])
1223                         return 1;
1224         return 0;
1225 }
1226
1227 static int check_vendor_class(struct ib_mad_mgmt_vendor_class *vendor_class)
1228 {
1229         int i;
1230
1231         for (i = 0; i < MAX_MGMT_OUI; i++)
1232                 if (vendor_class->method_table[i])
1233                         return 1;
1234         return 0;
1235 }
1236
1237 static int find_vendor_oui(struct ib_mad_mgmt_vendor_class *vendor_class,
1238                            char *oui)
1239 {
1240         int i;
1241
1242         for (i = 0; i < MAX_MGMT_OUI; i++)
1243                 /* Is there matching OUI for this vendor class ? */
1244                 if (!memcmp(vendor_class->oui[i], oui, 3))
1245                         return i;
1246
1247         return -1;
1248 }
1249
1250 static int check_vendor_table(struct ib_mad_mgmt_vendor_class_table *vendor)
1251 {
1252         int i;
1253
1254         for (i = 0; i < MAX_MGMT_VENDOR_RANGE2; i++)
1255                 if (vendor->vendor_class[i])
1256                         return 1;
1257
1258         return 0;
1259 }
1260
1261 static void remove_methods_mad_agent(struct ib_mad_mgmt_method_table *method,
1262                                      struct ib_mad_agent_private *agent)
1263 {
1264         int i;
1265
1266         /* Remove any methods for this mad agent */
1267         for (i = 0; i < IB_MGMT_MAX_METHODS; i++) {
1268                 if (method->agent[i] == agent) {
1269                         method->agent[i] = NULL;
1270                 }
1271         }
1272 }
1273
1274 static int add_nonoui_reg_req(struct ib_mad_reg_req *mad_reg_req,
1275                               struct ib_mad_agent_private *agent_priv,
1276                               u8 mgmt_class)
1277 {
1278         struct ib_mad_port_private *port_priv;
1279         struct ib_mad_mgmt_class_table **class;
1280         struct ib_mad_mgmt_method_table **method;
1281         int i, ret;
1282
1283         port_priv = agent_priv->qp_info->port_priv;
1284         class = &port_priv->version[mad_reg_req->mgmt_class_version].class;
1285         if (!*class) {
1286                 /* Allocate management class table for "new" class version */
1287                 *class = kzalloc(sizeof **class, GFP_ATOMIC);
1288                 if (!*class) {
1289                         printk(KERN_ERR PFX "No memory for "
1290                                "ib_mad_mgmt_class_table\n");
1291                         ret = -ENOMEM;
1292                         goto error1;
1293                 }
1294
1295                 /* Allocate method table for this management class */
1296                 method = &(*class)->method_table[mgmt_class];
1297                 if ((ret = allocate_method_table(method)))
1298                         goto error2;
1299         } else {
1300                 method = &(*class)->method_table[mgmt_class];
1301                 if (!*method) {
1302                         /* Allocate method table for this management class */
1303                         if ((ret = allocate_method_table(method)))
1304                                 goto error1;
1305                 }
1306         }
1307
1308         /* Now, make sure methods are not already in use */
1309         if (method_in_use(method, mad_reg_req))
1310                 goto error3;
1311
1312         /* Finally, add in methods being registered */
1313         for (i = find_first_bit(mad_reg_req->method_mask,
1314                                 IB_MGMT_MAX_METHODS);
1315              i < IB_MGMT_MAX_METHODS;
1316              i = find_next_bit(mad_reg_req->method_mask, IB_MGMT_MAX_METHODS,
1317                                1+i)) {
1318                 (*method)->agent[i] = agent_priv;
1319         }
1320         return 0;
1321
1322 error3:
1323         /* Remove any methods for this mad agent */
1324         remove_methods_mad_agent(*method, agent_priv);
1325         /* Now, check to see if there are any methods in use */
1326         if (!check_method_table(*method)) {
1327                 /* If not, release management method table */
1328                 kfree(*method);
1329                 *method = NULL;
1330         }
1331         ret = -EINVAL;
1332         goto error1;
1333 error2:
1334         kfree(*class);
1335         *class = NULL;
1336 error1:
1337         return ret;
1338 }
1339
1340 static int add_oui_reg_req(struct ib_mad_reg_req *mad_reg_req,
1341                            struct ib_mad_agent_private *agent_priv)
1342 {
1343         struct ib_mad_port_private *port_priv;
1344         struct ib_mad_mgmt_vendor_class_table **vendor_table;
1345         struct ib_mad_mgmt_vendor_class_table *vendor = NULL;
1346         struct ib_mad_mgmt_vendor_class *vendor_class = NULL;
1347         struct ib_mad_mgmt_method_table **method;
1348         int i, ret = -ENOMEM;
1349         u8 vclass;
1350
1351         /* "New" vendor (with OUI) class */
1352         vclass = vendor_class_index(mad_reg_req->mgmt_class);
1353         port_priv = agent_priv->qp_info->port_priv;
1354         vendor_table = &port_priv->version[
1355                                 mad_reg_req->mgmt_class_version].vendor;
1356         if (!*vendor_table) {
1357                 /* Allocate mgmt vendor class table for "new" class version */
1358                 vendor = kzalloc(sizeof *vendor, GFP_ATOMIC);
1359                 if (!vendor) {
1360                         printk(KERN_ERR PFX "No memory for "
1361                                "ib_mad_mgmt_vendor_class_table\n");
1362                         goto error1;
1363                 }
1364
1365                 *vendor_table = vendor;
1366         }
1367         if (!(*vendor_table)->vendor_class[vclass]) {
1368                 /* Allocate table for this management vendor class */
1369                 vendor_class = kzalloc(sizeof *vendor_class, GFP_ATOMIC);
1370                 if (!vendor_class) {
1371                         printk(KERN_ERR PFX "No memory for "
1372                                "ib_mad_mgmt_vendor_class\n");
1373                         goto error2;
1374                 }
1375
1376                 (*vendor_table)->vendor_class[vclass] = vendor_class;
1377         }
1378         for (i = 0; i < MAX_MGMT_OUI; i++) {
1379                 /* Is there matching OUI for this vendor class ? */
1380                 if (!memcmp((*vendor_table)->vendor_class[vclass]->oui[i],
1381                             mad_reg_req->oui, 3)) {
1382                         method = &(*vendor_table)->vendor_class[
1383                                                 vclass]->method_table[i];
1384                         BUG_ON(!*method);
1385                         goto check_in_use;
1386                 }
1387         }
1388         for (i = 0; i < MAX_MGMT_OUI; i++) {
1389                 /* OUI slot available ? */
1390                 if (!is_vendor_oui((*vendor_table)->vendor_class[
1391                                 vclass]->oui[i])) {
1392                         method = &(*vendor_table)->vendor_class[
1393                                 vclass]->method_table[i];
1394                         BUG_ON(*method);
1395                         /* Allocate method table for this OUI */
1396                         if ((ret = allocate_method_table(method)))
1397                                 goto error3;
1398                         memcpy((*vendor_table)->vendor_class[vclass]->oui[i],
1399                                mad_reg_req->oui, 3);
1400                         goto check_in_use;
1401                 }
1402         }
1403         printk(KERN_ERR PFX "All OUI slots in use\n");
1404         goto error3;
1405
1406 check_in_use:
1407         /* Now, make sure methods are not already in use */
1408         if (method_in_use(method, mad_reg_req))
1409                 goto error4;
1410
1411         /* Finally, add in methods being registered */
1412         for (i = find_first_bit(mad_reg_req->method_mask,
1413                                 IB_MGMT_MAX_METHODS);
1414              i < IB_MGMT_MAX_METHODS;
1415              i = find_next_bit(mad_reg_req->method_mask, IB_MGMT_MAX_METHODS,
1416                                1+i)) {
1417                 (*method)->agent[i] = agent_priv;
1418         }
1419         return 0;
1420
1421 error4:
1422         /* Remove any methods for this mad agent */
1423         remove_methods_mad_agent(*method, agent_priv);
1424         /* Now, check to see if there are any methods in use */
1425         if (!check_method_table(*method)) {
1426                 /* If not, release management method table */
1427                 kfree(*method);
1428                 *method = NULL;
1429         }
1430         ret = -EINVAL;
1431 error3:
1432         if (vendor_class) {
1433                 (*vendor_table)->vendor_class[vclass] = NULL;
1434                 kfree(vendor_class);
1435         }
1436 error2:
1437         if (vendor) {
1438                 *vendor_table = NULL;
1439                 kfree(vendor);
1440         }
1441 error1:
1442         return ret;
1443 }
1444
1445 static void remove_mad_reg_req(struct ib_mad_agent_private *agent_priv)
1446 {
1447         struct ib_mad_port_private *port_priv;
1448         struct ib_mad_mgmt_class_table *class;
1449         struct ib_mad_mgmt_method_table *method;
1450         struct ib_mad_mgmt_vendor_class_table *vendor;
1451         struct ib_mad_mgmt_vendor_class *vendor_class;
1452         int index;
1453         u8 mgmt_class;
1454
1455         /*
1456          * Was MAD registration request supplied
1457          * with original registration ?
1458          */
1459         if (!agent_priv->reg_req) {
1460                 goto out;
1461         }
1462
1463         port_priv = agent_priv->qp_info->port_priv;
1464         mgmt_class = convert_mgmt_class(agent_priv->reg_req->mgmt_class);
1465         class = port_priv->version[
1466                         agent_priv->reg_req->mgmt_class_version].class;
1467         if (!class)
1468                 goto vendor_check;
1469
1470         method = class->method_table[mgmt_class];
1471         if (method) {
1472                 /* Remove any methods for this mad agent */
1473                 remove_methods_mad_agent(method, agent_priv);
1474                 /* Now, check to see if there are any methods still in use */
1475                 if (!check_method_table(method)) {
1476                         /* If not, release management method table */
1477                          kfree(method);
1478                          class->method_table[mgmt_class] = NULL;
1479                          /* Any management classes left ? */
1480                         if (!check_class_table(class)) {
1481                                 /* If not, release management class table */
1482                                 kfree(class);
1483                                 port_priv->version[
1484                                         agent_priv->reg_req->
1485                                         mgmt_class_version].class = NULL;
1486                         }
1487                 }
1488         }
1489
1490 vendor_check:
1491         if (!is_vendor_class(mgmt_class))
1492                 goto out;
1493
1494         /* normalize mgmt_class to vendor range 2 */
1495         mgmt_class = vendor_class_index(agent_priv->reg_req->mgmt_class);
1496         vendor = port_priv->version[
1497                         agent_priv->reg_req->mgmt_class_version].vendor;
1498
1499         if (!vendor)
1500                 goto out;
1501
1502         vendor_class = vendor->vendor_class[mgmt_class];
1503         if (vendor_class) {
1504                 index = find_vendor_oui(vendor_class, agent_priv->reg_req->oui);
1505                 if (index < 0)
1506                         goto out;
1507                 method = vendor_class->method_table[index];
1508                 if (method) {
1509                         /* Remove any methods for this mad agent */
1510                         remove_methods_mad_agent(method, agent_priv);
1511                         /*
1512                          * Now, check to see if there are
1513                          * any methods still in use
1514                          */
1515                         if (!check_method_table(method)) {
1516                                 /* If not, release management method table */
1517                                 kfree(method);
1518                                 vendor_class->method_table[index] = NULL;
1519                                 memset(vendor_class->oui[index], 0, 3);
1520                                 /* Any OUIs left ? */
1521                                 if (!check_vendor_class(vendor_class)) {
1522                                         /* If not, release vendor class table */
1523                                         kfree(vendor_class);
1524                                         vendor->vendor_class[mgmt_class] = NULL;
1525                                         /* Any other vendor classes left ? */
1526                                         if (!check_vendor_table(vendor)) {
1527                                                 kfree(vendor);
1528                                                 port_priv->version[
1529                                                         agent_priv->reg_req->
1530                                                         mgmt_class_version].
1531                                                         vendor = NULL;
1532                                         }
1533                                 }
1534                         }
1535                 }
1536         }
1537
1538 out:
1539         return;
1540 }
1541
1542 static struct ib_mad_agent_private *
1543 find_mad_agent(struct ib_mad_port_private *port_priv,
1544                struct ib_mad *mad)
1545 {
1546         struct ib_mad_agent_private *mad_agent = NULL;
1547         unsigned long flags;
1548
1549         spin_lock_irqsave(&port_priv->reg_lock, flags);
1550         if (response_mad(mad)) {
1551                 u32 hi_tid;
1552                 struct ib_mad_agent_private *entry;
1553
1554                 /*
1555                  * Routing is based on high 32 bits of transaction ID
1556                  * of MAD.
1557                  */
1558                 hi_tid = be64_to_cpu(mad->mad_hdr.tid) >> 32;
1559                 list_for_each_entry(entry, &port_priv->agent_list, agent_list) {
1560                         if (entry->agent.hi_tid == hi_tid) {
1561                                 mad_agent = entry;
1562                                 break;
1563                         }
1564                 }
1565         } else {
1566                 struct ib_mad_mgmt_class_table *class;
1567                 struct ib_mad_mgmt_method_table *method;
1568                 struct ib_mad_mgmt_vendor_class_table *vendor;
1569                 struct ib_mad_mgmt_vendor_class *vendor_class;
1570                 struct ib_vendor_mad *vendor_mad;
1571                 int index;
1572
1573                 /*
1574                  * Routing is based on version, class, and method
1575                  * For "newer" vendor MADs, also based on OUI
1576                  */
1577                 if (mad->mad_hdr.class_version >= MAX_MGMT_VERSION)
1578                         goto out;
1579                 if (!is_vendor_class(mad->mad_hdr.mgmt_class)) {
1580                         class = port_priv->version[
1581                                         mad->mad_hdr.class_version].class;
1582                         if (!class)
1583                                 goto out;
1584                         method = class->method_table[convert_mgmt_class(
1585                                                         mad->mad_hdr.mgmt_class)];
1586                         if (method)
1587                                 mad_agent = method->agent[mad->mad_hdr.method &
1588                                                           ~IB_MGMT_METHOD_RESP];
1589                 } else {
1590                         vendor = port_priv->version[
1591                                         mad->mad_hdr.class_version].vendor;
1592                         if (!vendor)
1593                                 goto out;
1594                         vendor_class = vendor->vendor_class[vendor_class_index(
1595                                                 mad->mad_hdr.mgmt_class)];
1596                         if (!vendor_class)
1597                                 goto out;
1598                         /* Find matching OUI */
1599                         vendor_mad = (struct ib_vendor_mad *)mad;
1600                         index = find_vendor_oui(vendor_class, vendor_mad->oui);
1601                         if (index == -1)
1602                                 goto out;
1603                         method = vendor_class->method_table[index];
1604                         if (method) {
1605                                 mad_agent = method->agent[mad->mad_hdr.method &
1606                                                           ~IB_MGMT_METHOD_RESP];
1607                         }
1608                 }
1609         }
1610
1611         if (mad_agent) {
1612                 if (mad_agent->agent.recv_handler)
1613                         atomic_inc(&mad_agent->refcount);
1614                 else {
1615                         printk(KERN_NOTICE PFX "No receive handler for client "
1616                                "%p on port %d\n",
1617                                &mad_agent->agent, port_priv->port_num);
1618                         mad_agent = NULL;
1619                 }
1620         }
1621 out:
1622         spin_unlock_irqrestore(&port_priv->reg_lock, flags);
1623
1624         return mad_agent;
1625 }
1626
1627 static int validate_mad(struct ib_mad *mad, u32 qp_num)
1628 {
1629         int valid = 0;
1630
1631         /* Make sure MAD base version is understood */
1632         if (mad->mad_hdr.base_version != IB_MGMT_BASE_VERSION) {
1633                 printk(KERN_ERR PFX "MAD received with unsupported base "
1634                        "version %d\n", mad->mad_hdr.base_version);
1635                 goto out;
1636         }
1637
1638         /* Filter SMI packets sent to other than QP0 */
1639         if ((mad->mad_hdr.mgmt_class == IB_MGMT_CLASS_SUBN_LID_ROUTED) ||
1640             (mad->mad_hdr.mgmt_class == IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE)) {
1641                 if (qp_num == 0)
1642                         valid = 1;
1643         } else {
1644                 /* Filter GSI packets sent to QP0 */
1645                 if (qp_num != 0)
1646                         valid = 1;
1647         }
1648
1649 out:
1650         return valid;
1651 }
1652
1653 static int is_data_mad(struct ib_mad_agent_private *mad_agent_priv,
1654                        struct ib_mad_hdr *mad_hdr)
1655 {
1656         struct ib_rmpp_mad *rmpp_mad;
1657
1658         rmpp_mad = (struct ib_rmpp_mad *)mad_hdr;
1659         return !mad_agent_priv->agent.rmpp_version ||
1660                 !(ib_get_rmpp_flags(&rmpp_mad->rmpp_hdr) &
1661                                     IB_MGMT_RMPP_FLAG_ACTIVE) ||
1662                 (rmpp_mad->rmpp_hdr.rmpp_type == IB_MGMT_RMPP_TYPE_DATA);
1663 }
1664
1665 static inline int rcv_has_same_class(struct ib_mad_send_wr_private *wr,
1666                                      struct ib_mad_recv_wc *rwc)
1667 {
1668         return ((struct ib_mad *)(wr->send_buf.mad))->mad_hdr.mgmt_class ==
1669                 rwc->recv_buf.mad->mad_hdr.mgmt_class;
1670 }
1671
1672 static inline int rcv_has_same_gid(struct ib_mad_send_wr_private *wr,
1673                                    struct ib_mad_recv_wc *rwc )
1674 {
1675         struct ib_ah_attr attr;
1676         u8 send_resp, rcv_resp;
1677
1678         send_resp = ((struct ib_mad *)(wr->send_buf.mad))->
1679                      mad_hdr.method & IB_MGMT_METHOD_RESP;
1680         rcv_resp = rwc->recv_buf.mad->mad_hdr.method & IB_MGMT_METHOD_RESP;
1681
1682         if (!send_resp && rcv_resp)
1683                 /* is request/response. GID/LIDs are both local (same). */
1684                 return 1;
1685
1686         if (send_resp == rcv_resp)
1687                 /* both requests, or both responses. GIDs different */
1688                 return 0;
1689
1690         if (ib_query_ah(wr->send_buf.ah, &attr))
1691                 /* Assume not equal, to avoid false positives. */
1692                 return 0;
1693
1694         if (!(attr.ah_flags & IB_AH_GRH) && !(rwc->wc->wc_flags & IB_WC_GRH))
1695                 return attr.dlid == rwc->wc->slid;
1696         else if ((attr.ah_flags & IB_AH_GRH) &&
1697                  (rwc->wc->wc_flags & IB_WC_GRH))
1698                 return memcmp(attr.grh.dgid.raw,
1699                               rwc->recv_buf.grh->sgid.raw, 16) == 0;
1700         else
1701                 /* one has GID, other does not.  Assume different */
1702                 return 0;
1703 }
1704 struct ib_mad_send_wr_private*
1705 ib_find_send_mad(struct ib_mad_agent_private *mad_agent_priv,
1706                  struct ib_mad_recv_wc *mad_recv_wc)
1707 {
1708         struct ib_mad_send_wr_private *mad_send_wr;
1709         struct ib_mad *mad;
1710
1711         mad = (struct ib_mad *)mad_recv_wc->recv_buf.mad;
1712
1713         list_for_each_entry(mad_send_wr, &mad_agent_priv->wait_list,
1714                             agent_list) {
1715                 if ((mad_send_wr->tid == mad->mad_hdr.tid) &&
1716                     rcv_has_same_class(mad_send_wr, mad_recv_wc) &&
1717                     rcv_has_same_gid(mad_send_wr, mad_recv_wc))
1718                         return mad_send_wr;
1719         }
1720
1721         /*
1722          * It's possible to receive the response before we've
1723          * been notified that the send has completed
1724          */
1725         list_for_each_entry(mad_send_wr, &mad_agent_priv->send_list,
1726                             agent_list) {
1727                 if (is_data_mad(mad_agent_priv, mad_send_wr->send_buf.mad) &&
1728                     mad_send_wr->tid == mad->mad_hdr.tid &&
1729                     mad_send_wr->timeout &&
1730                     rcv_has_same_class(mad_send_wr, mad_recv_wc) &&
1731                     rcv_has_same_gid(mad_send_wr, mad_recv_wc)) {
1732                         /* Verify request has not been canceled */
1733                         return (mad_send_wr->status == IB_WC_SUCCESS) ?
1734                                 mad_send_wr : NULL;
1735                 }
1736         }
1737         return NULL;
1738 }
1739
1740 void ib_mark_mad_done(struct ib_mad_send_wr_private *mad_send_wr)
1741 {
1742         mad_send_wr->timeout = 0;
1743         if (mad_send_wr->refcount == 1) {
1744                 list_del(&mad_send_wr->agent_list);
1745                 list_add_tail(&mad_send_wr->agent_list,
1746                               &mad_send_wr->mad_agent_priv->done_list);
1747         }
1748 }
1749
1750 static void ib_mad_complete_recv(struct ib_mad_agent_private *mad_agent_priv,
1751                                  struct ib_mad_recv_wc *mad_recv_wc)
1752 {
1753         struct ib_mad_send_wr_private *mad_send_wr;
1754         struct ib_mad_send_wc mad_send_wc;
1755         unsigned long flags;
1756
1757         INIT_LIST_HEAD(&mad_recv_wc->rmpp_list);
1758         list_add(&mad_recv_wc->recv_buf.list, &mad_recv_wc->rmpp_list);
1759         if (mad_agent_priv->agent.rmpp_version) {
1760                 mad_recv_wc = ib_process_rmpp_recv_wc(mad_agent_priv,
1761                                                       mad_recv_wc);
1762                 if (!mad_recv_wc) {
1763                         if (atomic_dec_and_test(&mad_agent_priv->refcount))
1764                                 wake_up(&mad_agent_priv->wait);
1765                         return;
1766                 }
1767         }
1768
1769         /* Complete corresponding request */
1770         if (response_mad(mad_recv_wc->recv_buf.mad)) {
1771                 spin_lock_irqsave(&mad_agent_priv->lock, flags);
1772                 mad_send_wr = ib_find_send_mad(mad_agent_priv, mad_recv_wc);
1773                 if (!mad_send_wr) {
1774                         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1775                         ib_free_recv_mad(mad_recv_wc);
1776                         if (atomic_dec_and_test(&mad_agent_priv->refcount))
1777                                 wake_up(&mad_agent_priv->wait);
1778                         return;
1779                 }
1780                 ib_mark_mad_done(mad_send_wr);
1781                 spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
1782
1783                 /* Defined behavior is to complete response before request */
1784                 mad_recv_wc->wc->wr_id = (unsigned long) &mad_send_wr->send_buf;
1785                 mad_agent_priv->agent.recv_handler(&mad_agent_priv->agent,
1786                                                    mad_recv_wc);
1787                 atomic_dec(&mad_agent_priv->refcount);
1788
1789                 mad_send_wc.status = IB_WC_SUCCESS;
1790                 mad_send_wc.vendor_err = 0;
1791                 mad_send_wc.send_buf = &mad_send_wr->send_buf;
1792                 ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
1793         } else {
1794                 mad_agent_priv->agent.recv_handler(&mad_agent_priv->agent,
1795                                                    mad_recv_wc);
1796                 if (atomic_dec_and_test(&mad_agent_priv->refcount))
1797                         wake_up(&mad_agent_priv->wait);
1798         }
1799 }
1800
1801 static void ib_mad_recv_done_handler(struct ib_mad_port_private *port_priv,
1802                                      struct ib_wc *wc)
1803 {
1804         struct ib_mad_qp_info *qp_info;
1805         struct ib_mad_private_header *mad_priv_hdr;
1806         struct ib_mad_private *recv, *response;
1807         struct ib_mad_list_head *mad_list;
1808         struct ib_mad_agent_private *mad_agent;
1809
1810         response = kmem_cache_alloc(ib_mad_cache, GFP_KERNEL);
1811         if (!response)
1812                 printk(KERN_ERR PFX "ib_mad_recv_done_handler no memory "
1813                        "for response buffer\n");
1814
1815         mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
1816         qp_info = mad_list->mad_queue->qp_info;
1817         dequeue_mad(mad_list);
1818
1819         mad_priv_hdr = container_of(mad_list, struct ib_mad_private_header,
1820                                     mad_list);
1821         recv = container_of(mad_priv_hdr, struct ib_mad_private, header);
1822         dma_unmap_single(port_priv->device->dma_device,
1823                          pci_unmap_addr(&recv->header, mapping),
1824                          sizeof(struct ib_mad_private) -
1825                          sizeof(struct ib_mad_private_header),
1826                          DMA_FROM_DEVICE);
1827
1828         /* Setup MAD receive work completion from "normal" work completion */
1829         recv->header.wc = *wc;
1830         recv->header.recv_wc.wc = &recv->header.wc;
1831         recv->header.recv_wc.mad_len = sizeof(struct ib_mad);
1832         recv->header.recv_wc.recv_buf.mad = &recv->mad.mad;
1833         recv->header.recv_wc.recv_buf.grh = &recv->grh;
1834
1835         if (atomic_read(&qp_info->snoop_count))
1836                 snoop_recv(qp_info, &recv->header.recv_wc, IB_MAD_SNOOP_RECVS);
1837
1838         /* Validate MAD */
1839         if (!validate_mad(&recv->mad.mad, qp_info->qp->qp_num))
1840                 goto out;
1841
1842         if (recv->mad.mad.mad_hdr.mgmt_class ==
1843             IB_MGMT_CLASS_SUBN_DIRECTED_ROUTE) {
1844                 if (!smi_handle_dr_smp_recv(&recv->mad.smp,
1845                                             port_priv->device->node_type,
1846                                             port_priv->port_num,
1847                                             port_priv->device->phys_port_cnt))
1848                         goto out;
1849                 if (!smi_check_forward_dr_smp(&recv->mad.smp))
1850                         goto local;
1851                 if (!smi_handle_dr_smp_send(&recv->mad.smp,
1852                                             port_priv->device->node_type,
1853                                             port_priv->port_num))
1854                         goto out;
1855                 if (!smi_check_local_smp(&recv->mad.smp, port_priv->device))
1856                         goto out;
1857         }
1858
1859 local:
1860         /* Give driver "right of first refusal" on incoming MAD */
1861         if (port_priv->device->process_mad) {
1862                 int ret;
1863
1864                 if (!response) {
1865                         printk(KERN_ERR PFX "No memory for response MAD\n");
1866                         /*
1867                          * Is it better to assume that
1868                          * it wouldn't be processed ?
1869                          */
1870                         goto out;
1871                 }
1872
1873                 ret = port_priv->device->process_mad(port_priv->device, 0,
1874                                                      port_priv->port_num,
1875                                                      wc, &recv->grh,
1876                                                      &recv->mad.mad,
1877                                                      &response->mad.mad);
1878                 if (ret & IB_MAD_RESULT_SUCCESS) {
1879                         if (ret & IB_MAD_RESULT_CONSUMED)
1880                                 goto out;
1881                         if (ret & IB_MAD_RESULT_REPLY) {
1882                                 agent_send_response(&response->mad.mad,
1883                                                     &recv->grh, wc,
1884                                                     port_priv->device,
1885                                                     port_priv->port_num,
1886                                                     qp_info->qp->qp_num);
1887                                 goto out;
1888                         }
1889                 }
1890         }
1891
1892         mad_agent = find_mad_agent(port_priv, &recv->mad.mad);
1893         if (mad_agent) {
1894                 ib_mad_complete_recv(mad_agent, &recv->header.recv_wc);
1895                 /*
1896                  * recv is freed up in error cases in ib_mad_complete_recv
1897                  * or via recv_handler in ib_mad_complete_recv()
1898                  */
1899                 recv = NULL;
1900         }
1901
1902 out:
1903         /* Post another receive request for this QP */
1904         if (response) {
1905                 ib_mad_post_receive_mads(qp_info, response);
1906                 if (recv)
1907                         kmem_cache_free(ib_mad_cache, recv);
1908         } else
1909                 ib_mad_post_receive_mads(qp_info, recv);
1910 }
1911
1912 static void adjust_timeout(struct ib_mad_agent_private *mad_agent_priv)
1913 {
1914         struct ib_mad_send_wr_private *mad_send_wr;
1915         unsigned long delay;
1916
1917         if (list_empty(&mad_agent_priv->wait_list)) {
1918                 cancel_delayed_work(&mad_agent_priv->timed_work);
1919         } else {
1920                 mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
1921                                          struct ib_mad_send_wr_private,
1922                                          agent_list);
1923
1924                 if (time_after(mad_agent_priv->timeout,
1925                                mad_send_wr->timeout)) {
1926                         mad_agent_priv->timeout = mad_send_wr->timeout;
1927                         cancel_delayed_work(&mad_agent_priv->timed_work);
1928                         delay = mad_send_wr->timeout - jiffies;
1929                         if ((long)delay <= 0)
1930                                 delay = 1;
1931                         queue_delayed_work(mad_agent_priv->qp_info->
1932                                            port_priv->wq,
1933                                            &mad_agent_priv->timed_work, delay);
1934                 }
1935         }
1936 }
1937
1938 static void wait_for_response(struct ib_mad_send_wr_private *mad_send_wr)
1939 {
1940         struct ib_mad_agent_private *mad_agent_priv;
1941         struct ib_mad_send_wr_private *temp_mad_send_wr;
1942         struct list_head *list_item;
1943         unsigned long delay;
1944
1945         mad_agent_priv = mad_send_wr->mad_agent_priv;
1946         list_del(&mad_send_wr->agent_list);
1947
1948         delay = mad_send_wr->timeout;
1949         mad_send_wr->timeout += jiffies;
1950
1951         if (delay) {
1952                 list_for_each_prev(list_item, &mad_agent_priv->wait_list) {
1953                         temp_mad_send_wr = list_entry(list_item,
1954                                                 struct ib_mad_send_wr_private,
1955                                                 agent_list);
1956                         if (time_after(mad_send_wr->timeout,
1957                                        temp_mad_send_wr->timeout))
1958                                 break;
1959                 }
1960         }
1961         else
1962                 list_item = &mad_agent_priv->wait_list;
1963         list_add(&mad_send_wr->agent_list, list_item);
1964
1965         /* Reschedule a work item if we have a shorter timeout */
1966         if (mad_agent_priv->wait_list.next == &mad_send_wr->agent_list) {
1967                 cancel_delayed_work(&mad_agent_priv->timed_work);
1968                 queue_delayed_work(mad_agent_priv->qp_info->port_priv->wq,
1969                                    &mad_agent_priv->timed_work, delay);
1970         }
1971 }
1972
1973 void ib_reset_mad_timeout(struct ib_mad_send_wr_private *mad_send_wr,
1974                           int timeout_ms)
1975 {
1976         mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
1977         wait_for_response(mad_send_wr);
1978 }
1979
1980 /*
1981  * Process a send work completion
1982  */
1983 void ib_mad_complete_send_wr(struct ib_mad_send_wr_private *mad_send_wr,
1984                              struct ib_mad_send_wc *mad_send_wc)
1985 {
1986         struct ib_mad_agent_private     *mad_agent_priv;
1987         unsigned long                   flags;
1988         int                             ret;
1989
1990         mad_agent_priv = mad_send_wr->mad_agent_priv;
1991         spin_lock_irqsave(&mad_agent_priv->lock, flags);
1992         if (mad_agent_priv->agent.rmpp_version) {
1993                 ret = ib_process_rmpp_send_wc(mad_send_wr, mad_send_wc);
1994                 if (ret == IB_RMPP_RESULT_CONSUMED)
1995                         goto done;
1996         } else
1997                 ret = IB_RMPP_RESULT_UNHANDLED;
1998
1999         if (mad_send_wc->status != IB_WC_SUCCESS &&
2000             mad_send_wr->status == IB_WC_SUCCESS) {
2001                 mad_send_wr->status = mad_send_wc->status;
2002                 mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2003         }
2004
2005         if (--mad_send_wr->refcount > 0) {
2006                 if (mad_send_wr->refcount == 1 && mad_send_wr->timeout &&
2007                     mad_send_wr->status == IB_WC_SUCCESS) {
2008                         wait_for_response(mad_send_wr);
2009                 }
2010                 goto done;
2011         }
2012
2013         /* Remove send from MAD agent and notify client of completion */
2014         list_del(&mad_send_wr->agent_list);
2015         adjust_timeout(mad_agent_priv);
2016         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2017
2018         if (mad_send_wr->status != IB_WC_SUCCESS )
2019                 mad_send_wc->status = mad_send_wr->status;
2020         if (ret == IB_RMPP_RESULT_INTERNAL)
2021                 ib_rmpp_send_handler(mad_send_wc);
2022         else
2023                 mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2024                                                    mad_send_wc);
2025
2026         /* Release reference on agent taken when sending */
2027         if (atomic_dec_and_test(&mad_agent_priv->refcount))
2028                 wake_up(&mad_agent_priv->wait);
2029         return;
2030 done:
2031         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2032 }
2033
2034 static void ib_mad_send_done_handler(struct ib_mad_port_private *port_priv,
2035                                      struct ib_wc *wc)
2036 {
2037         struct ib_mad_send_wr_private   *mad_send_wr, *queued_send_wr;
2038         struct ib_mad_list_head         *mad_list;
2039         struct ib_mad_qp_info           *qp_info;
2040         struct ib_mad_queue             *send_queue;
2041         struct ib_send_wr               *bad_send_wr;
2042         struct ib_mad_send_wc           mad_send_wc;
2043         unsigned long flags;
2044         int ret;
2045
2046         mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
2047         mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2048                                    mad_list);
2049         send_queue = mad_list->mad_queue;
2050         qp_info = send_queue->qp_info;
2051
2052 retry:
2053         dma_unmap_single(mad_send_wr->send_buf.mad_agent->device->dma_device,
2054                          pci_unmap_addr(mad_send_wr, header_mapping),
2055                          mad_send_wr->sg_list[0].length, DMA_TO_DEVICE);
2056         dma_unmap_single(mad_send_wr->send_buf.mad_agent->device->dma_device,
2057                          pci_unmap_addr(mad_send_wr, payload_mapping),
2058                          mad_send_wr->sg_list[1].length, DMA_TO_DEVICE);
2059         queued_send_wr = NULL;
2060         spin_lock_irqsave(&send_queue->lock, flags);
2061         list_del(&mad_list->list);
2062
2063         /* Move queued send to the send queue */
2064         if (send_queue->count-- > send_queue->max_active) {
2065                 mad_list = container_of(qp_info->overflow_list.next,
2066                                         struct ib_mad_list_head, list);
2067                 queued_send_wr = container_of(mad_list,
2068                                         struct ib_mad_send_wr_private,
2069                                         mad_list);
2070                 list_del(&mad_list->list);
2071                 list_add_tail(&mad_list->list, &send_queue->list);
2072         }
2073         spin_unlock_irqrestore(&send_queue->lock, flags);
2074
2075         mad_send_wc.send_buf = &mad_send_wr->send_buf;
2076         mad_send_wc.status = wc->status;
2077         mad_send_wc.vendor_err = wc->vendor_err;
2078         if (atomic_read(&qp_info->snoop_count))
2079                 snoop_send(qp_info, &mad_send_wr->send_buf, &mad_send_wc,
2080                            IB_MAD_SNOOP_SEND_COMPLETIONS);
2081         ib_mad_complete_send_wr(mad_send_wr, &mad_send_wc);
2082
2083         if (queued_send_wr) {
2084                 ret = ib_post_send(qp_info->qp, &queued_send_wr->send_wr,
2085                                    &bad_send_wr);
2086                 if (ret) {
2087                         printk(KERN_ERR PFX "ib_post_send failed: %d\n", ret);
2088                         mad_send_wr = queued_send_wr;
2089                         wc->status = IB_WC_LOC_QP_OP_ERR;
2090                         goto retry;
2091                 }
2092         }
2093 }
2094
2095 static void mark_sends_for_retry(struct ib_mad_qp_info *qp_info)
2096 {
2097         struct ib_mad_send_wr_private *mad_send_wr;
2098         struct ib_mad_list_head *mad_list;
2099         unsigned long flags;
2100
2101         spin_lock_irqsave(&qp_info->send_queue.lock, flags);
2102         list_for_each_entry(mad_list, &qp_info->send_queue.list, list) {
2103                 mad_send_wr = container_of(mad_list,
2104                                            struct ib_mad_send_wr_private,
2105                                            mad_list);
2106                 mad_send_wr->retry = 1;
2107         }
2108         spin_unlock_irqrestore(&qp_info->send_queue.lock, flags);
2109 }
2110
2111 static void mad_error_handler(struct ib_mad_port_private *port_priv,
2112                               struct ib_wc *wc)
2113 {
2114         struct ib_mad_list_head *mad_list;
2115         struct ib_mad_qp_info *qp_info;
2116         struct ib_mad_send_wr_private *mad_send_wr;
2117         int ret;
2118
2119         /* Determine if failure was a send or receive */
2120         mad_list = (struct ib_mad_list_head *)(unsigned long)wc->wr_id;
2121         qp_info = mad_list->mad_queue->qp_info;
2122         if (mad_list->mad_queue == &qp_info->recv_queue)
2123                 /*
2124                  * Receive errors indicate that the QP has entered the error
2125                  * state - error handling/shutdown code will cleanup
2126                  */
2127                 return;
2128
2129         /*
2130          * Send errors will transition the QP to SQE - move
2131          * QP to RTS and repost flushed work requests
2132          */
2133         mad_send_wr = container_of(mad_list, struct ib_mad_send_wr_private,
2134                                    mad_list);
2135         if (wc->status == IB_WC_WR_FLUSH_ERR) {
2136                 if (mad_send_wr->retry) {
2137                         /* Repost send */
2138                         struct ib_send_wr *bad_send_wr;
2139
2140                         mad_send_wr->retry = 0;
2141                         ret = ib_post_send(qp_info->qp, &mad_send_wr->send_wr,
2142                                         &bad_send_wr);
2143                         if (ret)
2144                                 ib_mad_send_done_handler(port_priv, wc);
2145                 } else
2146                         ib_mad_send_done_handler(port_priv, wc);
2147         } else {
2148                 struct ib_qp_attr *attr;
2149
2150                 /* Transition QP to RTS and fail offending send */
2151                 attr = kmalloc(sizeof *attr, GFP_KERNEL);
2152                 if (attr) {
2153                         attr->qp_state = IB_QPS_RTS;
2154                         attr->cur_qp_state = IB_QPS_SQE;
2155                         ret = ib_modify_qp(qp_info->qp, attr,
2156                                            IB_QP_STATE | IB_QP_CUR_STATE);
2157                         kfree(attr);
2158                         if (ret)
2159                                 printk(KERN_ERR PFX "mad_error_handler - "
2160                                        "ib_modify_qp to RTS : %d\n", ret);
2161                         else
2162                                 mark_sends_for_retry(qp_info);
2163                 }
2164                 ib_mad_send_done_handler(port_priv, wc);
2165         }
2166 }
2167
2168 /*
2169  * IB MAD completion callback
2170  */
2171 static void ib_mad_completion_handler(void *data)
2172 {
2173         struct ib_mad_port_private *port_priv;
2174         struct ib_wc wc;
2175
2176         port_priv = (struct ib_mad_port_private *)data;
2177         ib_req_notify_cq(port_priv->cq, IB_CQ_NEXT_COMP);
2178
2179         while (ib_poll_cq(port_priv->cq, 1, &wc) == 1) {
2180                 if (wc.status == IB_WC_SUCCESS) {
2181                         switch (wc.opcode) {
2182                         case IB_WC_SEND:
2183                                 ib_mad_send_done_handler(port_priv, &wc);
2184                                 break;
2185                         case IB_WC_RECV:
2186                                 ib_mad_recv_done_handler(port_priv, &wc);
2187                                 break;
2188                         default:
2189                                 BUG_ON(1);
2190                                 break;
2191                         }
2192                 } else
2193                         mad_error_handler(port_priv, &wc);
2194         }
2195 }
2196
2197 static void cancel_mads(struct ib_mad_agent_private *mad_agent_priv)
2198 {
2199         unsigned long flags;
2200         struct ib_mad_send_wr_private *mad_send_wr, *temp_mad_send_wr;
2201         struct ib_mad_send_wc mad_send_wc;
2202         struct list_head cancel_list;
2203
2204         INIT_LIST_HEAD(&cancel_list);
2205
2206         spin_lock_irqsave(&mad_agent_priv->lock, flags);
2207         list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2208                                  &mad_agent_priv->send_list, agent_list) {
2209                 if (mad_send_wr->status == IB_WC_SUCCESS) {
2210                         mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2211                         mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2212                 }
2213         }
2214
2215         /* Empty wait list to prevent receives from finding a request */
2216         list_splice_init(&mad_agent_priv->wait_list, &cancel_list);
2217         /* Empty local completion list as well */
2218         list_splice_init(&mad_agent_priv->local_list, &cancel_list);
2219         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2220
2221         /* Report all cancelled requests */
2222         mad_send_wc.status = IB_WC_WR_FLUSH_ERR;
2223         mad_send_wc.vendor_err = 0;
2224
2225         list_for_each_entry_safe(mad_send_wr, temp_mad_send_wr,
2226                                  &cancel_list, agent_list) {
2227                 mad_send_wc.send_buf = &mad_send_wr->send_buf;
2228                 list_del(&mad_send_wr->agent_list);
2229                 mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2230                                                    &mad_send_wc);
2231                 atomic_dec(&mad_agent_priv->refcount);
2232         }
2233 }
2234
2235 static struct ib_mad_send_wr_private*
2236 find_send_wr(struct ib_mad_agent_private *mad_agent_priv,
2237              struct ib_mad_send_buf *send_buf)
2238 {
2239         struct ib_mad_send_wr_private *mad_send_wr;
2240
2241         list_for_each_entry(mad_send_wr, &mad_agent_priv->wait_list,
2242                             agent_list) {
2243                 if (&mad_send_wr->send_buf == send_buf)
2244                         return mad_send_wr;
2245         }
2246
2247         list_for_each_entry(mad_send_wr, &mad_agent_priv->send_list,
2248                             agent_list) {
2249                 if (is_data_mad(mad_agent_priv, mad_send_wr->send_buf.mad) &&
2250                     &mad_send_wr->send_buf == send_buf)
2251                         return mad_send_wr;
2252         }
2253         return NULL;
2254 }
2255
2256 int ib_modify_mad(struct ib_mad_agent *mad_agent,
2257                   struct ib_mad_send_buf *send_buf, u32 timeout_ms)
2258 {
2259         struct ib_mad_agent_private *mad_agent_priv;
2260         struct ib_mad_send_wr_private *mad_send_wr;
2261         unsigned long flags;
2262         int active;
2263
2264         mad_agent_priv = container_of(mad_agent, struct ib_mad_agent_private,
2265                                       agent);
2266         spin_lock_irqsave(&mad_agent_priv->lock, flags);
2267         mad_send_wr = find_send_wr(mad_agent_priv, send_buf);
2268         if (!mad_send_wr || mad_send_wr->status != IB_WC_SUCCESS) {
2269                 spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2270                 return -EINVAL;
2271         }
2272
2273         active = (!mad_send_wr->timeout || mad_send_wr->refcount > 1);
2274         if (!timeout_ms) {
2275                 mad_send_wr->status = IB_WC_WR_FLUSH_ERR;
2276                 mad_send_wr->refcount -= (mad_send_wr->timeout > 0);
2277         }
2278
2279         mad_send_wr->send_buf.timeout_ms = timeout_ms;
2280         if (active)
2281                 mad_send_wr->timeout = msecs_to_jiffies(timeout_ms);
2282         else
2283                 ib_reset_mad_timeout(mad_send_wr, timeout_ms);
2284
2285         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2286         return 0;
2287 }
2288 EXPORT_SYMBOL(ib_modify_mad);
2289
2290 void ib_cancel_mad(struct ib_mad_agent *mad_agent,
2291                    struct ib_mad_send_buf *send_buf)
2292 {
2293         ib_modify_mad(mad_agent, send_buf, 0);
2294 }
2295 EXPORT_SYMBOL(ib_cancel_mad);
2296
2297 static void local_completions(void *data)
2298 {
2299         struct ib_mad_agent_private *mad_agent_priv;
2300         struct ib_mad_local_private *local;
2301         struct ib_mad_agent_private *recv_mad_agent;
2302         unsigned long flags;
2303         int recv = 0;
2304         struct ib_wc wc;
2305         struct ib_mad_send_wc mad_send_wc;
2306
2307         mad_agent_priv = (struct ib_mad_agent_private *)data;
2308
2309         spin_lock_irqsave(&mad_agent_priv->lock, flags);
2310         while (!list_empty(&mad_agent_priv->local_list)) {
2311                 local = list_entry(mad_agent_priv->local_list.next,
2312                                    struct ib_mad_local_private,
2313                                    completion_list);
2314                 spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2315                 if (local->mad_priv) {
2316                         recv_mad_agent = local->recv_mad_agent;
2317                         if (!recv_mad_agent) {
2318                                 printk(KERN_ERR PFX "No receive MAD agent for local completion\n");
2319                                 goto local_send_completion;
2320                         }
2321
2322                         recv = 1;
2323                         /*
2324                          * Defined behavior is to complete response
2325                          * before request
2326                          */
2327                         build_smp_wc((unsigned long) local->mad_send_wr,
2328                                      be16_to_cpu(IB_LID_PERMISSIVE),
2329                                      0, recv_mad_agent->agent.port_num, &wc);
2330
2331                         local->mad_priv->header.recv_wc.wc = &wc;
2332                         local->mad_priv->header.recv_wc.mad_len =
2333                                                 sizeof(struct ib_mad);
2334                         INIT_LIST_HEAD(&local->mad_priv->header.recv_wc.rmpp_list);
2335                         list_add(&local->mad_priv->header.recv_wc.recv_buf.list,
2336                                  &local->mad_priv->header.recv_wc.rmpp_list);
2337                         local->mad_priv->header.recv_wc.recv_buf.grh = NULL;
2338                         local->mad_priv->header.recv_wc.recv_buf.mad =
2339                                                 &local->mad_priv->mad.mad;
2340                         if (atomic_read(&recv_mad_agent->qp_info->snoop_count))
2341                                 snoop_recv(recv_mad_agent->qp_info,
2342                                           &local->mad_priv->header.recv_wc,
2343                                            IB_MAD_SNOOP_RECVS);
2344                         recv_mad_agent->agent.recv_handler(
2345                                                 &recv_mad_agent->agent,
2346                                                 &local->mad_priv->header.recv_wc);
2347                         spin_lock_irqsave(&recv_mad_agent->lock, flags);
2348                         atomic_dec(&recv_mad_agent->refcount);
2349                         spin_unlock_irqrestore(&recv_mad_agent->lock, flags);
2350                 }
2351
2352 local_send_completion:
2353                 /* Complete send */
2354                 mad_send_wc.status = IB_WC_SUCCESS;
2355                 mad_send_wc.vendor_err = 0;
2356                 mad_send_wc.send_buf = &local->mad_send_wr->send_buf;
2357                 if (atomic_read(&mad_agent_priv->qp_info->snoop_count))
2358                         snoop_send(mad_agent_priv->qp_info,
2359                                    &local->mad_send_wr->send_buf,
2360                                    &mad_send_wc, IB_MAD_SNOOP_SEND_COMPLETIONS);
2361                 mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2362                                                    &mad_send_wc);
2363
2364                 spin_lock_irqsave(&mad_agent_priv->lock, flags);
2365                 list_del(&local->completion_list);
2366                 atomic_dec(&mad_agent_priv->refcount);
2367                 if (!recv)
2368                         kmem_cache_free(ib_mad_cache, local->mad_priv);
2369                 kfree(local);
2370         }
2371         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2372 }
2373
2374 static int retry_send(struct ib_mad_send_wr_private *mad_send_wr)
2375 {
2376         int ret;
2377
2378         if (!mad_send_wr->retries--)
2379                 return -ETIMEDOUT;
2380
2381         mad_send_wr->timeout = msecs_to_jiffies(mad_send_wr->send_buf.timeout_ms);
2382
2383         if (mad_send_wr->mad_agent_priv->agent.rmpp_version) {
2384                 ret = ib_retry_rmpp(mad_send_wr);
2385                 switch (ret) {
2386                 case IB_RMPP_RESULT_UNHANDLED:
2387                         ret = ib_send_mad(mad_send_wr);
2388                         break;
2389                 case IB_RMPP_RESULT_CONSUMED:
2390                         ret = 0;
2391                         break;
2392                 default:
2393                         ret = -ECOMM;
2394                         break;
2395                 }
2396         } else
2397                 ret = ib_send_mad(mad_send_wr);
2398
2399         if (!ret) {
2400                 mad_send_wr->refcount++;
2401                 list_add_tail(&mad_send_wr->agent_list,
2402                               &mad_send_wr->mad_agent_priv->send_list);
2403         }
2404         return ret;
2405 }
2406
2407 static void timeout_sends(void *data)
2408 {
2409         struct ib_mad_agent_private *mad_agent_priv;
2410         struct ib_mad_send_wr_private *mad_send_wr;
2411         struct ib_mad_send_wc mad_send_wc;
2412         unsigned long flags, delay;
2413
2414         mad_agent_priv = (struct ib_mad_agent_private *)data;
2415         mad_send_wc.vendor_err = 0;
2416
2417         spin_lock_irqsave(&mad_agent_priv->lock, flags);
2418         while (!list_empty(&mad_agent_priv->wait_list)) {
2419                 mad_send_wr = list_entry(mad_agent_priv->wait_list.next,
2420                                          struct ib_mad_send_wr_private,
2421                                          agent_list);
2422
2423                 if (time_after(mad_send_wr->timeout, jiffies)) {
2424                         delay = mad_send_wr->timeout - jiffies;
2425                         if ((long)delay <= 0)
2426                                 delay = 1;
2427                         queue_delayed_work(mad_agent_priv->qp_info->
2428                                            port_priv->wq,
2429                                            &mad_agent_priv->timed_work, delay);
2430                         break;
2431                 }
2432
2433                 list_del(&mad_send_wr->agent_list);
2434                 if (mad_send_wr->status == IB_WC_SUCCESS &&
2435                     !retry_send(mad_send_wr))
2436                         continue;
2437
2438                 spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2439
2440                 if (mad_send_wr->status == IB_WC_SUCCESS)
2441                         mad_send_wc.status = IB_WC_RESP_TIMEOUT_ERR;
2442                 else
2443                         mad_send_wc.status = mad_send_wr->status;
2444                 mad_send_wc.send_buf = &mad_send_wr->send_buf;
2445                 mad_agent_priv->agent.send_handler(&mad_agent_priv->agent,
2446                                                    &mad_send_wc);
2447
2448                 atomic_dec(&mad_agent_priv->refcount);
2449                 spin_lock_irqsave(&mad_agent_priv->lock, flags);
2450         }
2451         spin_unlock_irqrestore(&mad_agent_priv->lock, flags);
2452 }
2453
2454 static void ib_mad_thread_completion_handler(struct ib_cq *cq, void *arg)
2455 {
2456         struct ib_mad_port_private *port_priv = cq->cq_context;
2457         unsigned long flags;
2458
2459         spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2460         if (!list_empty(&port_priv->port_list))
2461                 queue_work(port_priv->wq, &port_priv->work);
2462         spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2463 }
2464
2465 /*
2466  * Allocate receive MADs and post receive WRs for them
2467  */
2468 static int ib_mad_post_receive_mads(struct ib_mad_qp_info *qp_info,
2469                                     struct ib_mad_private *mad)
2470 {
2471         unsigned long flags;
2472         int post, ret;
2473         struct ib_mad_private *mad_priv;
2474         struct ib_sge sg_list;
2475         struct ib_recv_wr recv_wr, *bad_recv_wr;
2476         struct ib_mad_queue *recv_queue = &qp_info->recv_queue;
2477
2478         /* Initialize common scatter list fields */
2479         sg_list.length = sizeof *mad_priv - sizeof mad_priv->header;
2480         sg_list.lkey = (*qp_info->port_priv->mr).lkey;
2481
2482         /* Initialize common receive WR fields */
2483         recv_wr.next = NULL;
2484         recv_wr.sg_list = &sg_list;
2485         recv_wr.num_sge = 1;
2486
2487         do {
2488                 /* Allocate and map receive buffer */
2489                 if (mad) {
2490                         mad_priv = mad;
2491                         mad = NULL;
2492                 } else {
2493                         mad_priv = kmem_cache_alloc(ib_mad_cache, GFP_KERNEL);
2494                         if (!mad_priv) {
2495                                 printk(KERN_ERR PFX "No memory for receive buffer\n");
2496                                 ret = -ENOMEM;
2497                                 break;
2498                         }
2499                 }
2500                 sg_list.addr = dma_map_single(qp_info->port_priv->
2501                                                 device->dma_device,
2502                                               &mad_priv->grh,
2503                                               sizeof *mad_priv -
2504                                                 sizeof mad_priv->header,
2505                                               DMA_FROM_DEVICE);
2506                 pci_unmap_addr_set(&mad_priv->header, mapping, sg_list.addr);
2507                 recv_wr.wr_id = (unsigned long)&mad_priv->header.mad_list;
2508                 mad_priv->header.mad_list.mad_queue = recv_queue;
2509
2510                 /* Post receive WR */
2511                 spin_lock_irqsave(&recv_queue->lock, flags);
2512                 post = (++recv_queue->count < recv_queue->max_active);
2513                 list_add_tail(&mad_priv->header.mad_list.list, &recv_queue->list);
2514                 spin_unlock_irqrestore(&recv_queue->lock, flags);
2515                 ret = ib_post_recv(qp_info->qp, &recv_wr, &bad_recv_wr);
2516                 if (ret) {
2517                         spin_lock_irqsave(&recv_queue->lock, flags);
2518                         list_del(&mad_priv->header.mad_list.list);
2519                         recv_queue->count--;
2520                         spin_unlock_irqrestore(&recv_queue->lock, flags);
2521                         dma_unmap_single(qp_info->port_priv->device->dma_device,
2522                                          pci_unmap_addr(&mad_priv->header,
2523                                                         mapping),
2524                                          sizeof *mad_priv -
2525                                            sizeof mad_priv->header,
2526                                          DMA_FROM_DEVICE);
2527                         kmem_cache_free(ib_mad_cache, mad_priv);
2528                         printk(KERN_ERR PFX "ib_post_recv failed: %d\n", ret);
2529                         break;
2530                 }
2531         } while (post);
2532
2533         return ret;
2534 }
2535
2536 /*
2537  * Return all the posted receive MADs
2538  */
2539 static void cleanup_recv_queue(struct ib_mad_qp_info *qp_info)
2540 {
2541         struct ib_mad_private_header *mad_priv_hdr;
2542         struct ib_mad_private *recv;
2543         struct ib_mad_list_head *mad_list;
2544
2545         while (!list_empty(&qp_info->recv_queue.list)) {
2546
2547                 mad_list = list_entry(qp_info->recv_queue.list.next,
2548                                       struct ib_mad_list_head, list);
2549                 mad_priv_hdr = container_of(mad_list,
2550                                             struct ib_mad_private_header,
2551                                             mad_list);
2552                 recv = container_of(mad_priv_hdr, struct ib_mad_private,
2553                                     header);
2554
2555                 /* Remove from posted receive MAD list */
2556                 list_del(&mad_list->list);
2557
2558                 dma_unmap_single(qp_info->port_priv->device->dma_device,
2559                                  pci_unmap_addr(&recv->header, mapping),
2560                                  sizeof(struct ib_mad_private) -
2561                                  sizeof(struct ib_mad_private_header),
2562                                  DMA_FROM_DEVICE);
2563                 kmem_cache_free(ib_mad_cache, recv);
2564         }
2565
2566         qp_info->recv_queue.count = 0;
2567 }
2568
2569 /*
2570  * Start the port
2571  */
2572 static int ib_mad_port_start(struct ib_mad_port_private *port_priv)
2573 {
2574         int ret, i;
2575         struct ib_qp_attr *attr;
2576         struct ib_qp *qp;
2577
2578         attr = kmalloc(sizeof *attr, GFP_KERNEL);
2579         if (!attr) {
2580                 printk(KERN_ERR PFX "Couldn't kmalloc ib_qp_attr\n");
2581                 return -ENOMEM;
2582         }
2583
2584         for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2585                 qp = port_priv->qp_info[i].qp;
2586                 /*
2587                  * PKey index for QP1 is irrelevant but
2588                  * one is needed for the Reset to Init transition
2589                  */
2590                 attr->qp_state = IB_QPS_INIT;
2591                 attr->pkey_index = 0;
2592                 attr->qkey = (qp->qp_num == 0) ? 0 : IB_QP1_QKEY;
2593                 ret = ib_modify_qp(qp, attr, IB_QP_STATE |
2594                                              IB_QP_PKEY_INDEX | IB_QP_QKEY);
2595                 if (ret) {
2596                         printk(KERN_ERR PFX "Couldn't change QP%d state to "
2597                                "INIT: %d\n", i, ret);
2598                         goto out;
2599                 }
2600
2601                 attr->qp_state = IB_QPS_RTR;
2602                 ret = ib_modify_qp(qp, attr, IB_QP_STATE);
2603                 if (ret) {
2604                         printk(KERN_ERR PFX "Couldn't change QP%d state to "
2605                                "RTR: %d\n", i, ret);
2606                         goto out;
2607                 }
2608
2609                 attr->qp_state = IB_QPS_RTS;
2610                 attr->sq_psn = IB_MAD_SEND_Q_PSN;
2611                 ret = ib_modify_qp(qp, attr, IB_QP_STATE | IB_QP_SQ_PSN);
2612                 if (ret) {
2613                         printk(KERN_ERR PFX "Couldn't change QP%d state to "
2614                                "RTS: %d\n", i, ret);
2615                         goto out;
2616                 }
2617         }
2618
2619         ret = ib_req_notify_cq(port_priv->cq, IB_CQ_NEXT_COMP);
2620         if (ret) {
2621                 printk(KERN_ERR PFX "Failed to request completion "
2622                        "notification: %d\n", ret);
2623                 goto out;
2624         }
2625
2626         for (i = 0; i < IB_MAD_QPS_CORE; i++) {
2627                 ret = ib_mad_post_receive_mads(&port_priv->qp_info[i], NULL);
2628                 if (ret) {
2629                         printk(KERN_ERR PFX "Couldn't post receive WRs\n");
2630                         goto out;
2631                 }
2632         }
2633 out:
2634         kfree(attr);
2635         return ret;
2636 }
2637
2638 static void qp_event_handler(struct ib_event *event, void *qp_context)
2639 {
2640         struct ib_mad_qp_info   *qp_info = qp_context;
2641
2642         /* It's worse than that! He's dead, Jim! */
2643         printk(KERN_ERR PFX "Fatal error (%d) on MAD QP (%d)\n",
2644                 event->event, qp_info->qp->qp_num);
2645 }
2646
2647 static void init_mad_queue(struct ib_mad_qp_info *qp_info,
2648                            struct ib_mad_queue *mad_queue)
2649 {
2650         mad_queue->qp_info = qp_info;
2651         mad_queue->count = 0;
2652         spin_lock_init(&mad_queue->lock);
2653         INIT_LIST_HEAD(&mad_queue->list);
2654 }
2655
2656 static void init_mad_qp(struct ib_mad_port_private *port_priv,
2657                         struct ib_mad_qp_info *qp_info)
2658 {
2659         qp_info->port_priv = port_priv;
2660         init_mad_queue(qp_info, &qp_info->send_queue);
2661         init_mad_queue(qp_info, &qp_info->recv_queue);
2662         INIT_LIST_HEAD(&qp_info->overflow_list);
2663         spin_lock_init(&qp_info->snoop_lock);
2664         qp_info->snoop_table = NULL;
2665         qp_info->snoop_table_size = 0;
2666         atomic_set(&qp_info->snoop_count, 0);
2667 }
2668
2669 static int create_mad_qp(struct ib_mad_qp_info *qp_info,
2670                          enum ib_qp_type qp_type)
2671 {
2672         struct ib_qp_init_attr  qp_init_attr;
2673         int ret;
2674
2675         memset(&qp_init_attr, 0, sizeof qp_init_attr);
2676         qp_init_attr.send_cq = qp_info->port_priv->cq;
2677         qp_init_attr.recv_cq = qp_info->port_priv->cq;
2678         qp_init_attr.sq_sig_type = IB_SIGNAL_ALL_WR;
2679         qp_init_attr.cap.max_send_wr = IB_MAD_QP_SEND_SIZE;
2680         qp_init_attr.cap.max_recv_wr = IB_MAD_QP_RECV_SIZE;
2681         qp_init_attr.cap.max_send_sge = IB_MAD_SEND_REQ_MAX_SG;
2682         qp_init_attr.cap.max_recv_sge = IB_MAD_RECV_REQ_MAX_SG;
2683         qp_init_attr.qp_type = qp_type;
2684         qp_init_attr.port_num = qp_info->port_priv->port_num;
2685         qp_init_attr.qp_context = qp_info;
2686         qp_init_attr.event_handler = qp_event_handler;
2687         qp_info->qp = ib_create_qp(qp_info->port_priv->pd, &qp_init_attr);
2688         if (IS_ERR(qp_info->qp)) {
2689                 printk(KERN_ERR PFX "Couldn't create ib_mad QP%d\n",
2690                        get_spl_qp_index(qp_type));
2691                 ret = PTR_ERR(qp_info->qp);
2692                 goto error;
2693         }
2694         /* Use minimum queue sizes unless the CQ is resized */
2695         qp_info->send_queue.max_active = IB_MAD_QP_SEND_SIZE;
2696         qp_info->recv_queue.max_active = IB_MAD_QP_RECV_SIZE;
2697         return 0;
2698
2699 error:
2700         return ret;
2701 }
2702
2703 static void destroy_mad_qp(struct ib_mad_qp_info *qp_info)
2704 {
2705         ib_destroy_qp(qp_info->qp);
2706         kfree(qp_info->snoop_table);
2707 }
2708
2709 /*
2710  * Open the port
2711  * Create the QP, PD, MR, and CQ if needed
2712  */
2713 static int ib_mad_port_open(struct ib_device *device,
2714                             int port_num)
2715 {
2716         int ret, cq_size;
2717         struct ib_mad_port_private *port_priv;
2718         unsigned long flags;
2719         char name[sizeof "ib_mad123"];
2720
2721         /* Create new device info */
2722         port_priv = kzalloc(sizeof *port_priv, GFP_KERNEL);
2723         if (!port_priv) {
2724                 printk(KERN_ERR PFX "No memory for ib_mad_port_private\n");
2725                 return -ENOMEM;
2726         }
2727
2728         port_priv->device = device;
2729         port_priv->port_num = port_num;
2730         spin_lock_init(&port_priv->reg_lock);
2731         INIT_LIST_HEAD(&port_priv->agent_list);
2732         init_mad_qp(port_priv, &port_priv->qp_info[0]);
2733         init_mad_qp(port_priv, &port_priv->qp_info[1]);
2734
2735         cq_size = (IB_MAD_QP_SEND_SIZE + IB_MAD_QP_RECV_SIZE) * 2;
2736         port_priv->cq = ib_create_cq(port_priv->device,
2737                                      ib_mad_thread_completion_handler,
2738                                      NULL, port_priv, cq_size);
2739         if (IS_ERR(port_priv->cq)) {
2740                 printk(KERN_ERR PFX "Couldn't create ib_mad CQ\n");
2741                 ret = PTR_ERR(port_priv->cq);
2742                 goto error3;
2743         }
2744
2745         port_priv->pd = ib_alloc_pd(device);
2746         if (IS_ERR(port_priv->pd)) {
2747                 printk(KERN_ERR PFX "Couldn't create ib_mad PD\n");
2748                 ret = PTR_ERR(port_priv->pd);
2749                 goto error4;
2750         }
2751
2752         port_priv->mr = ib_get_dma_mr(port_priv->pd, IB_ACCESS_LOCAL_WRITE);
2753         if (IS_ERR(port_priv->mr)) {
2754                 printk(KERN_ERR PFX "Couldn't get ib_mad DMA MR\n");
2755                 ret = PTR_ERR(port_priv->mr);
2756                 goto error5;
2757         }
2758
2759         ret = create_mad_qp(&port_priv->qp_info[0], IB_QPT_SMI);
2760         if (ret)
2761                 goto error6;
2762         ret = create_mad_qp(&port_priv->qp_info[1], IB_QPT_GSI);
2763         if (ret)
2764                 goto error7;
2765
2766         snprintf(name, sizeof name, "ib_mad%d", port_num);
2767         port_priv->wq = create_singlethread_workqueue(name);
2768         if (!port_priv->wq) {
2769                 ret = -ENOMEM;
2770                 goto error8;
2771         }
2772         INIT_WORK(&port_priv->work, ib_mad_completion_handler, port_priv);
2773
2774         spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2775         list_add_tail(&port_priv->port_list, &ib_mad_port_list);
2776         spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2777
2778         ret = ib_mad_port_start(port_priv);
2779         if (ret) {
2780                 printk(KERN_ERR PFX "Couldn't start port\n");
2781                 goto error9;
2782         }
2783
2784         return 0;
2785
2786 error9:
2787         spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2788         list_del_init(&port_priv->port_list);
2789         spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2790
2791         destroy_workqueue(port_priv->wq);
2792 error8:
2793         destroy_mad_qp(&port_priv->qp_info[1]);
2794 error7:
2795         destroy_mad_qp(&port_priv->qp_info[0]);
2796 error6:
2797         ib_dereg_mr(port_priv->mr);
2798 error5:
2799         ib_dealloc_pd(port_priv->pd);
2800 error4:
2801         ib_destroy_cq(port_priv->cq);
2802         cleanup_recv_queue(&port_priv->qp_info[1]);
2803         cleanup_recv_queue(&port_priv->qp_info[0]);
2804 error3:
2805         kfree(port_priv);
2806
2807         return ret;
2808 }
2809
2810 /*
2811  * Close the port
2812  * If there are no classes using the port, free the port
2813  * resources (CQ, MR, PD, QP) and remove the port's info structure
2814  */
2815 static int ib_mad_port_close(struct ib_device *device, int port_num)
2816 {
2817         struct ib_mad_port_private *port_priv;
2818         unsigned long flags;
2819
2820         spin_lock_irqsave(&ib_mad_port_list_lock, flags);
2821         port_priv = __ib_get_mad_port(device, port_num);
2822         if (port_priv == NULL) {
2823                 spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2824                 printk(KERN_ERR PFX "Port %d not found\n", port_num);
2825                 return -ENODEV;
2826         }
2827         list_del_init(&port_priv->port_list);
2828         spin_unlock_irqrestore(&ib_mad_port_list_lock, flags);
2829
2830         destroy_workqueue(port_priv->wq);
2831         destroy_mad_qp(&port_priv->qp_info[1]);
2832         destroy_mad_qp(&port_priv->qp_info[0]);
2833         ib_dereg_mr(port_priv->mr);
2834         ib_dealloc_pd(port_priv->pd);
2835         ib_destroy_cq(port_priv->cq);
2836         cleanup_recv_queue(&port_priv->qp_info[1]);
2837         cleanup_recv_queue(&port_priv->qp_info[0]);
2838         /* XXX: Handle deallocation of MAD registration tables */
2839
2840         kfree(port_priv);
2841
2842         return 0;
2843 }
2844
2845 static void ib_mad_init_device(struct ib_device *device)
2846 {
2847         int start, end, i;
2848
2849         if (device->node_type == IB_NODE_SWITCH) {
2850                 start = 0;
2851                 end   = 0;
2852         } else {
2853                 start = 1;
2854                 end   = device->phys_port_cnt;
2855         }
2856
2857         for (i = start; i <= end; i++) {
2858                 if (ib_mad_port_open(device, i)) {
2859                         printk(KERN_ERR PFX "Couldn't open %s port %d\n",
2860                                device->name, i);
2861                         goto error;
2862                 }
2863                 if (ib_agent_port_open(device, i)) {
2864                         printk(KERN_ERR PFX "Couldn't open %s port %d "
2865                                "for agents\n",
2866                                device->name, i);
2867                         goto error_agent;
2868                 }
2869         }
2870         return;
2871
2872 error_agent:
2873         if (ib_mad_port_close(device, i))
2874                 printk(KERN_ERR PFX "Couldn't close %s port %d\n",
2875                        device->name, i);
2876
2877 error:
2878         i--;
2879
2880         while (i >= start) {
2881                 if (ib_agent_port_close(device, i))
2882                         printk(KERN_ERR PFX "Couldn't close %s port %d "
2883                                "for agents\n",
2884                                device->name, i);
2885                 if (ib_mad_port_close(device, i))
2886                         printk(KERN_ERR PFX "Couldn't close %s port %d\n",
2887                                device->name, i);
2888                 i--;
2889         }
2890 }
2891
2892 static void ib_mad_remove_device(struct ib_device *device)
2893 {
2894         int i, num_ports, cur_port;
2895
2896         if (device->node_type == IB_NODE_SWITCH) {
2897                 num_ports = 1;
2898                 cur_port = 0;
2899         } else {
2900                 num_ports = device->phys_port_cnt;
2901                 cur_port = 1;
2902         }
2903         for (i = 0; i < num_ports; i++, cur_port++) {
2904                 if (ib_agent_port_close(device, cur_port))
2905                         printk(KERN_ERR PFX "Couldn't close %s port %d "
2906                                "for agents\n",
2907                                device->name, cur_port);
2908                 if (ib_mad_port_close(device, cur_port))
2909                         printk(KERN_ERR PFX "Couldn't close %s port %d\n",
2910                                device->name, cur_port);
2911         }
2912 }
2913
2914 static struct ib_client mad_client = {
2915         .name   = "mad",
2916         .add = ib_mad_init_device,
2917         .remove = ib_mad_remove_device
2918 };
2919
2920 static int __init ib_mad_init_module(void)
2921 {
2922         int ret;
2923
2924         spin_lock_init(&ib_mad_port_list_lock);
2925
2926         ib_mad_cache = kmem_cache_create("ib_mad",
2927                                          sizeof(struct ib_mad_private),
2928                                          0,
2929                                          SLAB_HWCACHE_ALIGN,
2930                                          NULL,
2931                                          NULL);
2932         if (!ib_mad_cache) {
2933                 printk(KERN_ERR PFX "Couldn't create ib_mad cache\n");
2934                 ret = -ENOMEM;
2935                 goto error1;
2936         }
2937
2938         INIT_LIST_HEAD(&ib_mad_port_list);
2939
2940         if (ib_register_client(&mad_client)) {
2941                 printk(KERN_ERR PFX "Couldn't register ib_mad client\n");
2942                 ret = -EINVAL;
2943                 goto error2;
2944         }
2945
2946         return 0;
2947
2948 error2:
2949         kmem_cache_destroy(ib_mad_cache);
2950 error1:
2951         return ret;
2952 }
2953
2954 static void __exit ib_mad_cleanup_module(void)
2955 {
2956         ib_unregister_client(&mad_client);
2957
2958         if (kmem_cache_destroy(ib_mad_cache)) {
2959                 printk(KERN_DEBUG PFX "Failed to destroy ib_mad cache\n");
2960         }
2961 }
2962
2963 module_init(ib_mad_init_module);
2964 module_exit(ib_mad_cleanup_module);
2965