Merge git://git.kernel.org/pub/scm/linux/kernel/git/sfrench/cifs-2.6
[pandora-kernel.git] / drivers / infiniband / hw / ehca / ehca_main.c
1 /*
2  *  IBM eServer eHCA Infiniband device driver for Linux on POWER
3  *
4  *  module start stop, hca detection
5  *
6  *  Authors: Heiko J Schick <schickhj@de.ibm.com>
7  *           Hoang-Nam Nguyen <hnguyen@de.ibm.com>
8  *           Joachim Fenkes <fenkes@de.ibm.com>
9  *
10  *  Copyright (c) 2005 IBM Corporation
11  *
12  *  All rights reserved.
13  *
14  *  This source code is distributed under a dual license of GPL v2.0 and OpenIB
15  *  BSD.
16  *
17  * OpenIB BSD License
18  *
19  * Redistribution and use in source and binary forms, with or without
20  * modification, are permitted provided that the following conditions are met:
21  *
22  * Redistributions of source code must retain the above copyright notice, this
23  * list of conditions and the following disclaimer.
24  *
25  * Redistributions in binary form must reproduce the above copyright notice,
26  * this list of conditions and the following disclaimer in the documentation
27  * and/or other materials
28  * provided with the distribution.
29  *
30  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
31  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
32  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
33  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
34  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
35  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
36  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
37  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
38  * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
39  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
40  * POSSIBILITY OF SUCH DAMAGE.
41  */
42
43 #ifdef CONFIG_PPC_64K_PAGES
44 #include <linux/slab.h>
45 #endif
46
47 #include "ehca_classes.h"
48 #include "ehca_iverbs.h"
49 #include "ehca_mrmw.h"
50 #include "ehca_tools.h"
51 #include "hcp_if.h"
52
53 #define HCAD_VERSION "0025"
54
55 MODULE_LICENSE("Dual BSD/GPL");
56 MODULE_AUTHOR("Christoph Raisch <raisch@de.ibm.com>");
57 MODULE_DESCRIPTION("IBM eServer HCA InfiniBand Device Driver");
58 MODULE_VERSION(HCAD_VERSION);
59
60 int ehca_open_aqp1     = 0;
61 int ehca_debug_level   = 0;
62 int ehca_hw_level      = 0;
63 int ehca_nr_ports      = 2;
64 int ehca_use_hp_mr     = 0;
65 int ehca_port_act_time = 30;
66 int ehca_poll_all_eqs  = 1;
67 int ehca_static_rate   = -1;
68 int ehca_scaling_code  = 0;
69 int ehca_mr_largepage  = 1;
70 int ehca_lock_hcalls   = -1;
71
72 module_param_named(open_aqp1,     ehca_open_aqp1,     int, S_IRUGO);
73 module_param_named(debug_level,   ehca_debug_level,   int, S_IRUGO);
74 module_param_named(hw_level,      ehca_hw_level,      int, S_IRUGO);
75 module_param_named(nr_ports,      ehca_nr_ports,      int, S_IRUGO);
76 module_param_named(use_hp_mr,     ehca_use_hp_mr,     int, S_IRUGO);
77 module_param_named(port_act_time, ehca_port_act_time, int, S_IRUGO);
78 module_param_named(poll_all_eqs,  ehca_poll_all_eqs,  int, S_IRUGO);
79 module_param_named(static_rate,   ehca_static_rate,   int, S_IRUGO);
80 module_param_named(scaling_code,  ehca_scaling_code,  int, S_IRUGO);
81 module_param_named(mr_largepage,  ehca_mr_largepage,  int, S_IRUGO);
82 module_param_named(lock_hcalls,   ehca_lock_hcalls,   bool, S_IRUGO);
83
84 MODULE_PARM_DESC(open_aqp1,
85                  "AQP1 on startup (0: no (default), 1: yes)");
86 MODULE_PARM_DESC(debug_level,
87                  "debug level"
88                  " (0: no debug traces (default), 1: with debug traces)");
89 MODULE_PARM_DESC(hw_level,
90                  "hardware level"
91                  " (0: autosensing (default), 1: v. 0.20, 2: v. 0.21)");
92 MODULE_PARM_DESC(nr_ports,
93                  "number of connected ports (-1: autodetect, 1: port one only, "
94                  "2: two ports (default)");
95 MODULE_PARM_DESC(use_hp_mr,
96                  "high performance MRs (0: no (default), 1: yes)");
97 MODULE_PARM_DESC(port_act_time,
98                  "time to wait for port activation (default: 30 sec)");
99 MODULE_PARM_DESC(poll_all_eqs,
100                  "polls all event queues periodically"
101                  " (0: no, 1: yes (default))");
102 MODULE_PARM_DESC(static_rate,
103                  "set permanent static rate (default: disabled)");
104 MODULE_PARM_DESC(scaling_code,
105                  "set scaling code (0: disabled/default, 1: enabled)");
106 MODULE_PARM_DESC(mr_largepage,
107                  "use large page for MR (0: use PAGE_SIZE (default), "
108                  "1: use large page depending on MR size");
109 MODULE_PARM_DESC(lock_hcalls,
110                  "serialize all hCalls made by the driver "
111                  "(default: autodetect)");
112
113 DEFINE_RWLOCK(ehca_qp_idr_lock);
114 DEFINE_RWLOCK(ehca_cq_idr_lock);
115 DEFINE_IDR(ehca_qp_idr);
116 DEFINE_IDR(ehca_cq_idr);
117
118 static LIST_HEAD(shca_list); /* list of all registered ehcas */
119 static DEFINE_SPINLOCK(shca_list_lock);
120
121 static struct timer_list poll_eqs_timer;
122
#ifdef CONFIG_PPC_64K_PAGES
/* slab cache for firmware control blocks; set up in ehca_create_slab_caches() */
static struct kmem_cache *ctblk_cache;

/*
 * Allocate one zero-filled firmware control block from ctblk_cache.
 *
 * @flags: allocation flags handed through to the slab allocator
 *
 * Returns the new block, or NULL after logging an error when the
 * allocation fails.
 */
void *ehca_alloc_fw_ctrlblock(gfp_t flags)
{
        void *ctblk = kmem_cache_zalloc(ctblk_cache, flags);

        if (ctblk)
                return ctblk;

        ehca_gen_err("Out of memory for ctblk");
        return NULL;
}

/*
 * Give a control block back to ctblk_cache.  A NULL @ptr is ignored.
 */
void ehca_free_fw_ctrlblock(void *ptr)
{
        if (!ptr)
                return;

        kmem_cache_free(ctblk_cache, ptr);
}
#endif
141
142 int ehca2ib_return_code(u64 ehca_rc)
143 {
144         switch (ehca_rc) {
145         case H_SUCCESS:
146                 return 0;
147         case H_RESOURCE:             /* Resource in use */
148         case H_BUSY:
149                 return -EBUSY;
150         case H_NOT_ENOUGH_RESOURCES: /* insufficient resources */
151         case H_CONSTRAINED:          /* resource constraint */
152         case H_NO_MEM:
153                 return -ENOMEM;
154         default:
155                 return -EINVAL;
156         }
157 }
158
/*
 * Create every slab cache the driver needs: PD, CQ, QP, AV, MR/MW, small
 * queues and -- with CONFIG_PPC_64K_PAGES -- the firmware control block
 * cache.
 *
 * Returns 0 on success.  On failure the caches created so far are torn
 * down again in reverse order and a negative errno value is returned.
 */
static int ehca_create_slab_caches(void)
{
        int ret;

        ret = ehca_init_pd_cache();
        if (ret) {
                ehca_gen_err("Cannot create PD SLAB cache.");
                return ret;
        }

        ret = ehca_init_cq_cache();
        if (ret) {
                ehca_gen_err("Cannot create CQ SLAB cache.");
                goto create_slab_caches2;
        }

        ret = ehca_init_qp_cache();
        if (ret) {
                ehca_gen_err("Cannot create QP SLAB cache.");
                goto create_slab_caches3;
        }

        ret = ehca_init_av_cache();
        if (ret) {
                ehca_gen_err("Cannot create AV SLAB cache.");
                goto create_slab_caches4;
        }

        ret = ehca_init_mrmw_cache();
        if (ret) {
                ehca_gen_err("Cannot create MR&MW SLAB cache.");
                goto create_slab_caches5;
        }

        ret = ehca_init_small_qp_cache();
        if (ret) {
                ehca_gen_err("Cannot create small queue SLAB cache.");
                goto create_slab_caches6;
        }

#ifdef CONFIG_PPC_64K_PAGES
        ctblk_cache = kmem_cache_create("ehca_cache_ctblk",
                                        EHCA_PAGESIZE, H_CB_ALIGNMENT,
                                        SLAB_HWCACHE_ALIGN,
                                        NULL);
        if (!ctblk_cache) {
                ehca_gen_err("Cannot create ctblk SLAB cache.");
                ehca_cleanup_small_qp_cache();
                /*
                 * ret is still 0 from the last successful init call;
                 * without an explicit error code the caller would be
                 * told that everything worked.
                 */
                ret = -ENOMEM;
                goto create_slab_caches6;
        }
#endif
        return 0;

create_slab_caches6:
        ehca_cleanup_mrmw_cache();

create_slab_caches5:
        ehca_cleanup_av_cache();

create_slab_caches4:
        ehca_cleanup_qp_cache();

create_slab_caches3:
        ehca_cleanup_cq_cache();

create_slab_caches2:
        ehca_cleanup_pd_cache();

        return ret;
}
229
/*
 * Release all slab caches set up by ehca_create_slab_caches().  The
 * per-object caches go first, in reverse order of their creation; the
 * control block cache (CONFIG_PPC_64K_PAGES only) is destroyed last and
 * only if it exists.
 */
static void ehca_destroy_slab_caches(void)
{
        ehca_cleanup_small_qp_cache();
        ehca_cleanup_mrmw_cache();
        ehca_cleanup_av_cache();
        ehca_cleanup_qp_cache();
        ehca_cleanup_cq_cache();
        ehca_cleanup_pd_cache();

#ifdef CONFIG_PPC_64K_PAGES
        if (ctblk_cache) {
                kmem_cache_destroy(ctblk_cache);
        }
#endif
}
243
244 #define EHCA_HCAAVER  EHCA_BMASK_IBM(32, 39)
245 #define EHCA_REVID    EHCA_BMASK_IBM(40, 63)
246
247 static struct cap_descr {
248         u64 mask;
249         char *descr;
250 } hca_cap_descr[] = {
251         { HCA_CAP_AH_PORT_NR_CHECK, "HCA_CAP_AH_PORT_NR_CHECK" },
252         { HCA_CAP_ATOMIC, "HCA_CAP_ATOMIC" },
253         { HCA_CAP_AUTO_PATH_MIG, "HCA_CAP_AUTO_PATH_MIG" },
254         { HCA_CAP_BAD_P_KEY_CTR, "HCA_CAP_BAD_P_KEY_CTR" },
255         { HCA_CAP_SQD_RTS_PORT_CHANGE, "HCA_CAP_SQD_RTS_PORT_CHANGE" },
256         { HCA_CAP_CUR_QP_STATE_MOD, "HCA_CAP_CUR_QP_STATE_MOD" },
257         { HCA_CAP_INIT_TYPE, "HCA_CAP_INIT_TYPE" },
258         { HCA_CAP_PORT_ACTIVE_EVENT, "HCA_CAP_PORT_ACTIVE_EVENT" },
259         { HCA_CAP_Q_KEY_VIOL_CTR, "HCA_CAP_Q_KEY_VIOL_CTR" },
260         { HCA_CAP_WQE_RESIZE, "HCA_CAP_WQE_RESIZE" },
261         { HCA_CAP_RAW_PACKET_MCAST, "HCA_CAP_RAW_PACKET_MCAST" },
262         { HCA_CAP_SHUTDOWN_PORT, "HCA_CAP_SHUTDOWN_PORT" },
263         { HCA_CAP_RC_LL_QP, "HCA_CAP_RC_LL_QP" },
264         { HCA_CAP_SRQ, "HCA_CAP_SRQ" },
265         { HCA_CAP_UD_LL_QP, "HCA_CAP_UD_LL_QP" },
266         { HCA_CAP_RESIZE_MR, "HCA_CAP_RESIZE_MR" },
267         { HCA_CAP_MINI_QP, "HCA_CAP_MINI_QP" },
268         { HCA_CAP_H_ALLOC_RES_SYNC, "HCA_CAP_H_ALLOC_RES_SYNC" },
269 };
270
271 static int ehca_sense_attributes(struct ehca_shca *shca)
272 {
273         int i, ret = 0;
274         u64 h_ret;
275         struct hipz_query_hca *rblock;
276         struct hipz_query_port *port;
277
278         static const u32 pgsize_map[] = {
279                 HCA_CAP_MR_PGSIZE_4K,  0x1000,
280                 HCA_CAP_MR_PGSIZE_64K, 0x10000,
281                 HCA_CAP_MR_PGSIZE_1M,  0x100000,
282                 HCA_CAP_MR_PGSIZE_16M, 0x1000000,
283         };
284
285         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
286         if (!rblock) {
287                 ehca_gen_err("Cannot allocate rblock memory.");
288                 return -ENOMEM;
289         }
290
291         h_ret = hipz_h_query_hca(shca->ipz_hca_handle, rblock);
292         if (h_ret != H_SUCCESS) {
293                 ehca_gen_err("Cannot query device properties. h_ret=%li",
294                              h_ret);
295                 ret = -EPERM;
296                 goto sense_attributes1;
297         }
298
299         if (ehca_nr_ports == 1)
300                 shca->num_ports = 1;
301         else
302                 shca->num_ports = (u8)rblock->num_ports;
303
304         ehca_gen_dbg(" ... found %x ports", rblock->num_ports);
305
306         if (ehca_hw_level == 0) {
307                 u32 hcaaver;
308                 u32 revid;
309
310                 hcaaver = EHCA_BMASK_GET(EHCA_HCAAVER, rblock->hw_ver);
311                 revid   = EHCA_BMASK_GET(EHCA_REVID, rblock->hw_ver);
312
313                 ehca_gen_dbg(" ... hardware version=%x:%x", hcaaver, revid);
314
315                 if (hcaaver == 1) {
316                         if (revid <= 3)
317                                 shca->hw_level = 0x10 | (revid + 1);
318                         else
319                                 shca->hw_level = 0x14;
320                 } else if (hcaaver == 2) {
321                         if (revid == 0)
322                                 shca->hw_level = 0x21;
323                         else if (revid == 0x10)
324                                 shca->hw_level = 0x22;
325                         else if (revid == 0x20 || revid == 0x21)
326                                 shca->hw_level = 0x23;
327                 }
328
329                 if (!shca->hw_level) {
330                         ehca_gen_warn("unknown hardware version"
331                                       " - assuming default level");
332                         shca->hw_level = 0x22;
333                 }
334         } else
335                 shca->hw_level = ehca_hw_level;
336         ehca_gen_dbg(" ... hardware level=%x", shca->hw_level);
337
338         shca->hca_cap = rblock->hca_cap_indicators;
339         ehca_gen_dbg(" ... HCA capabilities:");
340         for (i = 0; i < ARRAY_SIZE(hca_cap_descr); i++)
341                 if (EHCA_BMASK_GET(hca_cap_descr[i].mask, shca->hca_cap))
342                         ehca_gen_dbg("   %s", hca_cap_descr[i].descr);
343
344         /* Autodetect hCall locking -- the "H_ALLOC_RESOURCE synced" flag is
345          * a firmware property, so it's valid across all adapters
346          */
347         if (ehca_lock_hcalls == -1)
348                 ehca_lock_hcalls = !(shca->hca_cap & HCA_CAP_H_ALLOC_RES_SYNC);
349
350         /* translate supported MR page sizes; always support 4K */
351         shca->hca_cap_mr_pgsize = EHCA_PAGESIZE;
352         if (ehca_mr_largepage) { /* support extra sizes only if enabled */
353                 for (i = 0; i < ARRAY_SIZE(pgsize_map); i += 2)
354                         if (rblock->memory_page_size_supported & pgsize_map[i])
355                                 shca->hca_cap_mr_pgsize |= pgsize_map[i + 1];
356         }
357
358         /* query max MTU from first port -- it's the same for all ports */
359         port = (struct hipz_query_port *)rblock;
360         h_ret = hipz_h_query_port(shca->ipz_hca_handle, 1, port);
361         if (h_ret != H_SUCCESS) {
362                 ehca_gen_err("Cannot query port properties. h_ret=%li",
363                              h_ret);
364                 ret = -EPERM;
365                 goto sense_attributes1;
366         }
367
368         shca->max_mtu = port->max_mtu;
369
370 sense_attributes1:
371         ehca_free_fw_ctrlblock(rblock);
372         return ret;
373 }
374
375 static int init_node_guid(struct ehca_shca *shca)
376 {
377         int ret = 0;
378         struct hipz_query_hca *rblock;
379
380         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
381         if (!rblock) {
382                 ehca_err(&shca->ib_device, "Can't allocate rblock memory.");
383                 return -ENOMEM;
384         }
385
386         if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) {
387                 ehca_err(&shca->ib_device, "Can't query device properties");
388                 ret = -EINVAL;
389                 goto init_node_guid1;
390         }
391
392         memcpy(&shca->ib_device.node_guid, &rblock->node_guid, sizeof(u64));
393
394 init_node_guid1:
395         ehca_free_fw_ctrlblock(rblock);
396         return ret;
397 }
398
399 int ehca_init_device(struct ehca_shca *shca)
400 {
401         int ret;
402
403         ret = init_node_guid(shca);
404         if (ret)
405                 return ret;
406
407         strlcpy(shca->ib_device.name, "ehca%d", IB_DEVICE_NAME_MAX);
408         shca->ib_device.owner               = THIS_MODULE;
409
410         shca->ib_device.uverbs_abi_ver      = 8;
411         shca->ib_device.uverbs_cmd_mask     =
412                 (1ull << IB_USER_VERBS_CMD_GET_CONTEXT)         |
413                 (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE)        |
414                 (1ull << IB_USER_VERBS_CMD_QUERY_PORT)          |
415                 (1ull << IB_USER_VERBS_CMD_ALLOC_PD)            |
416                 (1ull << IB_USER_VERBS_CMD_DEALLOC_PD)          |
417                 (1ull << IB_USER_VERBS_CMD_REG_MR)              |
418                 (1ull << IB_USER_VERBS_CMD_DEREG_MR)            |
419                 (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
420                 (1ull << IB_USER_VERBS_CMD_CREATE_CQ)           |
421                 (1ull << IB_USER_VERBS_CMD_DESTROY_CQ)          |
422                 (1ull << IB_USER_VERBS_CMD_CREATE_QP)           |
423                 (1ull << IB_USER_VERBS_CMD_MODIFY_QP)           |
424                 (1ull << IB_USER_VERBS_CMD_QUERY_QP)            |
425                 (1ull << IB_USER_VERBS_CMD_DESTROY_QP)          |
426                 (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST)        |
427                 (1ull << IB_USER_VERBS_CMD_DETACH_MCAST);
428
429         shca->ib_device.node_type           = RDMA_NODE_IB_CA;
430         shca->ib_device.phys_port_cnt       = shca->num_ports;
431         shca->ib_device.num_comp_vectors    = 1;
432         shca->ib_device.dma_device          = &shca->ofdev->dev;
433         shca->ib_device.query_device        = ehca_query_device;
434         shca->ib_device.query_port          = ehca_query_port;
435         shca->ib_device.query_gid           = ehca_query_gid;
436         shca->ib_device.query_pkey          = ehca_query_pkey;
437         /* shca->in_device.modify_device    = ehca_modify_device    */
438         shca->ib_device.modify_port         = ehca_modify_port;
439         shca->ib_device.alloc_ucontext      = ehca_alloc_ucontext;
440         shca->ib_device.dealloc_ucontext    = ehca_dealloc_ucontext;
441         shca->ib_device.alloc_pd            = ehca_alloc_pd;
442         shca->ib_device.dealloc_pd          = ehca_dealloc_pd;
443         shca->ib_device.create_ah           = ehca_create_ah;
444         /* shca->ib_device.modify_ah        = ehca_modify_ah;       */
445         shca->ib_device.query_ah            = ehca_query_ah;
446         shca->ib_device.destroy_ah          = ehca_destroy_ah;
447         shca->ib_device.create_qp           = ehca_create_qp;
448         shca->ib_device.modify_qp           = ehca_modify_qp;
449         shca->ib_device.query_qp            = ehca_query_qp;
450         shca->ib_device.destroy_qp          = ehca_destroy_qp;
451         shca->ib_device.post_send           = ehca_post_send;
452         shca->ib_device.post_recv           = ehca_post_recv;
453         shca->ib_device.create_cq           = ehca_create_cq;
454         shca->ib_device.destroy_cq          = ehca_destroy_cq;
455         shca->ib_device.resize_cq           = ehca_resize_cq;
456         shca->ib_device.poll_cq             = ehca_poll_cq;
457         /* shca->ib_device.peek_cq          = ehca_peek_cq;         */
458         shca->ib_device.req_notify_cq       = ehca_req_notify_cq;
459         /* shca->ib_device.req_ncomp_notif  = ehca_req_ncomp_notif; */
460         shca->ib_device.get_dma_mr          = ehca_get_dma_mr;
461         shca->ib_device.reg_phys_mr         = ehca_reg_phys_mr;
462         shca->ib_device.reg_user_mr         = ehca_reg_user_mr;
463         shca->ib_device.query_mr            = ehca_query_mr;
464         shca->ib_device.dereg_mr            = ehca_dereg_mr;
465         shca->ib_device.rereg_phys_mr       = ehca_rereg_phys_mr;
466         shca->ib_device.alloc_mw            = ehca_alloc_mw;
467         shca->ib_device.bind_mw             = ehca_bind_mw;
468         shca->ib_device.dealloc_mw          = ehca_dealloc_mw;
469         shca->ib_device.alloc_fmr           = ehca_alloc_fmr;
470         shca->ib_device.map_phys_fmr        = ehca_map_phys_fmr;
471         shca->ib_device.unmap_fmr           = ehca_unmap_fmr;
472         shca->ib_device.dealloc_fmr         = ehca_dealloc_fmr;
473         shca->ib_device.attach_mcast        = ehca_attach_mcast;
474         shca->ib_device.detach_mcast        = ehca_detach_mcast;
475         /* shca->ib_device.process_mad      = ehca_process_mad;     */
476         shca->ib_device.mmap                = ehca_mmap;
477
478         if (EHCA_BMASK_GET(HCA_CAP_SRQ, shca->hca_cap)) {
479                 shca->ib_device.uverbs_cmd_mask |=
480                         (1ull << IB_USER_VERBS_CMD_CREATE_SRQ) |
481                         (1ull << IB_USER_VERBS_CMD_MODIFY_SRQ) |
482                         (1ull << IB_USER_VERBS_CMD_QUERY_SRQ) |
483                         (1ull << IB_USER_VERBS_CMD_DESTROY_SRQ);
484
485                 shca->ib_device.create_srq          = ehca_create_srq;
486                 shca->ib_device.modify_srq          = ehca_modify_srq;
487                 shca->ib_device.query_srq           = ehca_query_srq;
488                 shca->ib_device.destroy_srq         = ehca_destroy_srq;
489                 shca->ib_device.post_srq_recv       = ehca_post_srq_recv;
490         }
491
492         return ret;
493 }
494
495 static int ehca_create_aqp1(struct ehca_shca *shca, u32 port)
496 {
497         struct ehca_sport *sport = &shca->sport[port - 1];
498         struct ib_cq *ibcq;
499         struct ib_qp *ibqp;
500         struct ib_qp_init_attr qp_init_attr;
501         int ret;
502
503         if (sport->ibcq_aqp1) {
504                 ehca_err(&shca->ib_device, "AQP1 CQ is already created.");
505                 return -EPERM;
506         }
507
508         ibcq = ib_create_cq(&shca->ib_device, NULL, NULL, (void *)(-1), 10, 0);
509         if (IS_ERR(ibcq)) {
510                 ehca_err(&shca->ib_device, "Cannot create AQP1 CQ.");
511                 return PTR_ERR(ibcq);
512         }
513         sport->ibcq_aqp1 = ibcq;
514
515         if (sport->ibqp_sqp[IB_QPT_GSI]) {
516                 ehca_err(&shca->ib_device, "AQP1 QP is already created.");
517                 ret = -EPERM;
518                 goto create_aqp1;
519         }
520
521         memset(&qp_init_attr, 0, sizeof(struct ib_qp_init_attr));
522         qp_init_attr.send_cq          = ibcq;
523         qp_init_attr.recv_cq          = ibcq;
524         qp_init_attr.sq_sig_type      = IB_SIGNAL_ALL_WR;
525         qp_init_attr.cap.max_send_wr  = 100;
526         qp_init_attr.cap.max_recv_wr  = 100;
527         qp_init_attr.cap.max_send_sge = 2;
528         qp_init_attr.cap.max_recv_sge = 1;
529         qp_init_attr.qp_type          = IB_QPT_GSI;
530         qp_init_attr.port_num         = port;
531         qp_init_attr.qp_context       = NULL;
532         qp_init_attr.event_handler    = NULL;
533         qp_init_attr.srq              = NULL;
534
535         ibqp = ib_create_qp(&shca->pd->ib_pd, &qp_init_attr);
536         if (IS_ERR(ibqp)) {
537                 ehca_err(&shca->ib_device, "Cannot create AQP1 QP.");
538                 ret = PTR_ERR(ibqp);
539                 goto create_aqp1;
540         }
541         sport->ibqp_sqp[IB_QPT_GSI] = ibqp;
542
543         return 0;
544
545 create_aqp1:
546         ib_destroy_cq(sport->ibcq_aqp1);
547         return ret;
548 }
549
550 static int ehca_destroy_aqp1(struct ehca_sport *sport)
551 {
552         int ret;
553
554         ret = ib_destroy_qp(sport->ibqp_sqp[IB_QPT_GSI]);
555         if (ret) {
556                 ehca_gen_err("Cannot destroy AQP1 QP. ret=%i", ret);
557                 return ret;
558         }
559
560         ret = ib_destroy_cq(sport->ibcq_aqp1);
561         if (ret)
562                 ehca_gen_err("Cannot destroy AQP1 CQ. ret=%i", ret);
563
564         return ret;
565 }
566
567 static ssize_t ehca_show_debug_level(struct device_driver *ddp, char *buf)
568 {
569         return snprintf(buf, PAGE_SIZE, "%d\n",
570                         ehca_debug_level);
571 }
572
573 static ssize_t ehca_store_debug_level(struct device_driver *ddp,
574                                       const char *buf, size_t count)
575 {
576         int value = (*buf) - '0';
577         if (value >= 0 && value <= 9)
578                 ehca_debug_level = value;
579         return 1;
580 }
581
582 DRIVER_ATTR(debug_level, S_IRUSR | S_IWUSR,
583             ehca_show_debug_level, ehca_store_debug_level);
584
585 static struct attribute *ehca_drv_attrs[] = {
586         &driver_attr_debug_level.attr,
587         NULL
588 };
589
590 static struct attribute_group ehca_drv_attr_grp = {
591         .attrs = ehca_drv_attrs
592 };
593
594 static struct attribute_group *ehca_drv_attr_groups[] = {
595         &ehca_drv_attr_grp,
596         NULL,
597 };
598
599 #define EHCA_RESOURCE_ATTR(name)                                           \
600 static ssize_t  ehca_show_##name(struct device *dev,                       \
601                                  struct device_attribute *attr,            \
602                                  char *buf)                                \
603 {                                                                          \
604         struct ehca_shca *shca;                                            \
605         struct hipz_query_hca *rblock;                                     \
606         int data;                                                          \
607                                                                            \
608         shca = dev->driver_data;                                           \
609                                                                            \
610         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);                      \
611         if (!rblock) {                                                     \
612                 dev_err(dev, "Can't allocate rblock memory.\n");           \
613                 return 0;                                                  \
614         }                                                                  \
615                                                                            \
616         if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) { \
617                 dev_err(dev, "Can't query device properties\n");           \
618                 ehca_free_fw_ctrlblock(rblock);                            \
619                 return 0;                                                  \
620         }                                                                  \
621                                                                            \
622         data = rblock->name;                                               \
623         ehca_free_fw_ctrlblock(rblock);                                    \
624                                                                            \
625         if ((strcmp(#name, "num_ports") == 0) && (ehca_nr_ports == 1))     \
626                 return snprintf(buf, 256, "1\n");                          \
627         else                                                               \
628                 return snprintf(buf, 256, "%d\n", data);                   \
629                                                                            \
630 }                                                                          \
631 static DEVICE_ATTR(name, S_IRUGO, ehca_show_##name, NULL);
632
633 EHCA_RESOURCE_ATTR(num_ports);
634 EHCA_RESOURCE_ATTR(hw_ver);
635 EHCA_RESOURCE_ATTR(max_eq);
636 EHCA_RESOURCE_ATTR(cur_eq);
637 EHCA_RESOURCE_ATTR(max_cq);
638 EHCA_RESOURCE_ATTR(cur_cq);
639 EHCA_RESOURCE_ATTR(max_qp);
640 EHCA_RESOURCE_ATTR(cur_qp);
641 EHCA_RESOURCE_ATTR(max_mr);
642 EHCA_RESOURCE_ATTR(cur_mr);
643 EHCA_RESOURCE_ATTR(max_mw);
644 EHCA_RESOURCE_ATTR(cur_mw);
645 EHCA_RESOURCE_ATTR(max_pd);
646 EHCA_RESOURCE_ATTR(max_ah);
647
648 static ssize_t ehca_show_adapter_handle(struct device *dev,
649                                         struct device_attribute *attr,
650                                         char *buf)
651 {
652         struct ehca_shca *shca = dev->driver_data;
653
654         return sprintf(buf, "%lx\n", shca->ipz_hca_handle.handle);
655
656 }
657 static DEVICE_ATTR(adapter_handle, S_IRUGO, ehca_show_adapter_handle, NULL);
658
659 static ssize_t ehca_show_mr_largepage(struct device *dev,
660                                       struct device_attribute *attr,
661                                       char *buf)
662 {
663         return sprintf(buf, "%d\n", ehca_mr_largepage);
664 }
665 static DEVICE_ATTR(mr_largepage, S_IRUGO, ehca_show_mr_largepage, NULL);
666
667 static struct attribute *ehca_dev_attrs[] = {
668         &dev_attr_adapter_handle.attr,
669         &dev_attr_num_ports.attr,
670         &dev_attr_hw_ver.attr,
671         &dev_attr_max_eq.attr,
672         &dev_attr_cur_eq.attr,
673         &dev_attr_max_cq.attr,
674         &dev_attr_cur_cq.attr,
675         &dev_attr_max_qp.attr,
676         &dev_attr_cur_qp.attr,
677         &dev_attr_max_mr.attr,
678         &dev_attr_cur_mr.attr,
679         &dev_attr_max_mw.attr,
680         &dev_attr_cur_mw.attr,
681         &dev_attr_max_pd.attr,
682         &dev_attr_max_ah.attr,
683         &dev_attr_mr_largepage.attr,
684         NULL
685 };
686
687 static struct attribute_group ehca_dev_attr_grp = {
688         .attrs = ehca_dev_attrs
689 };
690
691 static int __devinit ehca_probe(struct of_device *dev,
692                                 const struct of_device_id *id)
693 {
694         struct ehca_shca *shca;
695         const u64 *handle;
696         struct ib_pd *ibpd;
697         int ret, i;
698
699         handle = of_get_property(dev->node, "ibm,hca-handle", NULL);
700         if (!handle) {
701                 ehca_gen_err("Cannot get eHCA handle for adapter: %s.",
702                              dev->node->full_name);
703                 return -ENODEV;
704         }
705
706         if (!(*handle)) {
707                 ehca_gen_err("Wrong eHCA handle for adapter: %s.",
708                              dev->node->full_name);
709                 return -ENODEV;
710         }
711
712         shca = (struct ehca_shca *)ib_alloc_device(sizeof(*shca));
713         if (!shca) {
714                 ehca_gen_err("Cannot allocate shca memory.");
715                 return -ENOMEM;
716         }
717         mutex_init(&shca->modify_mutex);
718         for (i = 0; i < ARRAY_SIZE(shca->sport); i++)
719                 spin_lock_init(&shca->sport[i].mod_sqp_lock);
720
721         shca->ofdev = dev;
722         shca->ipz_hca_handle.handle = *handle;
723         dev->dev.driver_data = shca;
724
725         ret = ehca_sense_attributes(shca);
726         if (ret < 0) {
727                 ehca_gen_err("Cannot sense eHCA attributes.");
728                 goto probe1;
729         }
730
731         ret = ehca_init_device(shca);
732         if (ret) {
733                 ehca_gen_err("Cannot init ehca  device struct");
734                 goto probe1;
735         }
736
737         /* create event queues */
738         ret = ehca_create_eq(shca, &shca->eq, EHCA_EQ, 2048);
739         if (ret) {
740                 ehca_err(&shca->ib_device, "Cannot create EQ.");
741                 goto probe1;
742         }
743
744         ret = ehca_create_eq(shca, &shca->neq, EHCA_NEQ, 513);
745         if (ret) {
746                 ehca_err(&shca->ib_device, "Cannot create NEQ.");
747                 goto probe3;
748         }
749
750         /* create internal protection domain */
751         ibpd = ehca_alloc_pd(&shca->ib_device, (void *)(-1), NULL);
752         if (IS_ERR(ibpd)) {
753                 ehca_err(&shca->ib_device, "Cannot create internal PD.");
754                 ret = PTR_ERR(ibpd);
755                 goto probe4;
756         }
757
758         shca->pd = container_of(ibpd, struct ehca_pd, ib_pd);
759         shca->pd->ib_pd.device = &shca->ib_device;
760
761         /* create internal max MR */
762         ret = ehca_reg_internal_maxmr(shca, shca->pd, &shca->maxmr);
763
764         if (ret) {
765                 ehca_err(&shca->ib_device, "Cannot create internal MR ret=%i",
766                          ret);
767                 goto probe5;
768         }
769
770         ret = ib_register_device(&shca->ib_device);
771         if (ret) {
772                 ehca_err(&shca->ib_device,
773                          "ib_register_device() failed ret=%i", ret);
774                 goto probe6;
775         }
776
777         /* create AQP1 for port 1 */
778         if (ehca_open_aqp1 == 1) {
779                 shca->sport[0].port_state = IB_PORT_DOWN;
780                 ret = ehca_create_aqp1(shca, 1);
781                 if (ret) {
782                         ehca_err(&shca->ib_device,
783                                  "Cannot create AQP1 for port 1.");
784                         goto probe7;
785                 }
786         }
787
788         /* create AQP1 for port 2 */
789         if ((ehca_open_aqp1 == 1) && (shca->num_ports == 2)) {
790                 shca->sport[1].port_state = IB_PORT_DOWN;
791                 ret = ehca_create_aqp1(shca, 2);
792                 if (ret) {
793                         ehca_err(&shca->ib_device,
794                                  "Cannot create AQP1 for port 2.");
795                         goto probe8;
796                 }
797         }
798
799         ret = sysfs_create_group(&dev->dev.kobj, &ehca_dev_attr_grp);
800         if (ret) /* only complain; we can live without attributes */
801                 ehca_err(&shca->ib_device,
802                          "Cannot create device attributes  ret=%d", ret);
803
804         spin_lock(&shca_list_lock);
805         list_add(&shca->shca_list, &shca_list);
806         spin_unlock(&shca_list_lock);
807
808         return 0;
809
810 probe8:
811         ret = ehca_destroy_aqp1(&shca->sport[0]);
812         if (ret)
813                 ehca_err(&shca->ib_device,
814                          "Cannot destroy AQP1 for port 1. ret=%i", ret);
815
816 probe7:
817         ib_unregister_device(&shca->ib_device);
818
819 probe6:
820         ret = ehca_dereg_internal_maxmr(shca);
821         if (ret)
822                 ehca_err(&shca->ib_device,
823                          "Cannot destroy internal MR. ret=%x", ret);
824
825 probe5:
826         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
827         if (ret)
828                 ehca_err(&shca->ib_device,
829                          "Cannot destroy internal PD. ret=%x", ret);
830
831 probe4:
832         ret = ehca_destroy_eq(shca, &shca->neq);
833         if (ret)
834                 ehca_err(&shca->ib_device,
835                          "Cannot destroy NEQ. ret=%x", ret);
836
837 probe3:
838         ret = ehca_destroy_eq(shca, &shca->eq);
839         if (ret)
840                 ehca_err(&shca->ib_device,
841                          "Cannot destroy EQ. ret=%x", ret);
842
843 probe1:
844         ib_dealloc_device(&shca->ib_device);
845
846         return -EINVAL;
847 }
848
849 static int __devexit ehca_remove(struct of_device *dev)
850 {
851         struct ehca_shca *shca = dev->dev.driver_data;
852         int ret;
853
854         sysfs_remove_group(&dev->dev.kobj, &ehca_dev_attr_grp);
855
856         if (ehca_open_aqp1 == 1) {
857                 int i;
858                 for (i = 0; i < shca->num_ports; i++) {
859                         ret = ehca_destroy_aqp1(&shca->sport[i]);
860                         if (ret)
861                                 ehca_err(&shca->ib_device,
862                                          "Cannot destroy AQP1 for port %x "
863                                          "ret=%i", ret, i);
864                 }
865         }
866
867         ib_unregister_device(&shca->ib_device);
868
869         ret = ehca_dereg_internal_maxmr(shca);
870         if (ret)
871                 ehca_err(&shca->ib_device,
872                          "Cannot destroy internal MR. ret=%i", ret);
873
874         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
875         if (ret)
876                 ehca_err(&shca->ib_device,
877                          "Cannot destroy internal PD. ret=%i", ret);
878
879         ret = ehca_destroy_eq(shca, &shca->eq);
880         if (ret)
881                 ehca_err(&shca->ib_device, "Cannot destroy EQ. ret=%i", ret);
882
883         ret = ehca_destroy_eq(shca, &shca->neq);
884         if (ret)
885                 ehca_err(&shca->ib_device, "Canot destroy NEQ. ret=%i", ret);
886
887         ib_dealloc_device(&shca->ib_device);
888
889         spin_lock(&shca_list_lock);
890         list_del(&shca->shca_list);
891         spin_unlock(&shca_list_lock);
892
893         return ret;
894 }
895
896 static struct of_device_id ehca_device_table[] =
897 {
898         {
899                 .name       = "lhca",
900                 .compatible = "IBM,lhca",
901         },
902         {},
903 };
904
905 static struct of_platform_driver ehca_driver = {
906         .name        = "ehca",
907         .match_table = ehca_device_table,
908         .probe       = ehca_probe,
909         .remove      = ehca_remove,
910         .driver      = {
911                 .groups = ehca_drv_attr_groups,
912         },
913 };
914
915 void ehca_poll_eqs(unsigned long data)
916 {
917         struct ehca_shca *shca;
918
919         spin_lock(&shca_list_lock);
920         list_for_each_entry(shca, &shca_list, shca_list) {
921                 if (shca->eq.is_initialized) {
922                         /* call deadman proc only if eq ptr does not change */
923                         struct ehca_eq *eq = &shca->eq;
924                         int max = 3;
925                         volatile u64 q_ofs, q_ofs2;
926                         u64 flags;
927                         spin_lock_irqsave(&eq->spinlock, flags);
928                         q_ofs = eq->ipz_queue.current_q_offset;
929                         spin_unlock_irqrestore(&eq->spinlock, flags);
930                         do {
931                                 spin_lock_irqsave(&eq->spinlock, flags);
932                                 q_ofs2 = eq->ipz_queue.current_q_offset;
933                                 spin_unlock_irqrestore(&eq->spinlock, flags);
934                                 max--;
935                         } while (q_ofs == q_ofs2 && max > 0);
936                         if (q_ofs == q_ofs2)
937                                 ehca_process_eq(shca, 0);
938                 }
939         }
940         mod_timer(&poll_eqs_timer, round_jiffies(jiffies + HZ));
941         spin_unlock(&shca_list_lock);
942 }
943
944 int __init ehca_module_init(void)
945 {
946         int ret;
947
948         printk(KERN_INFO "eHCA Infiniband Device Driver "
949                "(Version " HCAD_VERSION ")\n");
950
951         ret = ehca_create_comp_pool();
952         if (ret) {
953                 ehca_gen_err("Cannot create comp pool.");
954                 return ret;
955         }
956
957         ret = ehca_create_slab_caches();
958         if (ret) {
959                 ehca_gen_err("Cannot create SLAB caches");
960                 ret = -ENOMEM;
961                 goto module_init1;
962         }
963
964         ret = ibmebus_register_driver(&ehca_driver);
965         if (ret) {
966                 ehca_gen_err("Cannot register eHCA device driver");
967                 ret = -EINVAL;
968                 goto module_init2;
969         }
970
971         if (ehca_poll_all_eqs != 1) {
972                 ehca_gen_err("WARNING!!!");
973                 ehca_gen_err("It is possible to lose interrupts.");
974         } else {
975                 init_timer(&poll_eqs_timer);
976                 poll_eqs_timer.function = ehca_poll_eqs;
977                 poll_eqs_timer.expires = jiffies + HZ;
978                 add_timer(&poll_eqs_timer);
979         }
980
981         return 0;
982
983 module_init2:
984         ehca_destroy_slab_caches();
985
986 module_init1:
987         ehca_destroy_comp_pool();
988         return ret;
989 };
990
991 void __exit ehca_module_exit(void)
992 {
993         if (ehca_poll_all_eqs == 1)
994                 del_timer_sync(&poll_eqs_timer);
995
996         ibmebus_unregister_driver(&ehca_driver);
997
998         ehca_destroy_slab_caches();
999
1000         ehca_destroy_comp_pool();
1001
1002         idr_destroy(&ehca_cq_idr);
1003         idr_destroy(&ehca_qp_idr);
1004 };
1005
/* Register ehca_module_init/ehca_module_exit as the module's entry and exit points. */
module_init(ehca_module_init);
module_exit(ehca_module_exit);