]> nv-tegra.nvidia Code Review - linux-3.10.git/blob - drivers/infiniband/hw/ehca/ehca_main.c
IB/ehca: Support more than 4k QPs for userspace and kernelspace
[linux-3.10.git] / drivers / infiniband / hw / ehca / ehca_main.c
1 /*
2  *  IBM eServer eHCA Infiniband device driver for Linux on POWER
3  *
4  *  module start stop, hca detection
5  *
6  *  Authors: Heiko J Schick <schickhj@de.ibm.com>
7  *           Hoang-Nam Nguyen <hnguyen@de.ibm.com>
8  *           Joachim Fenkes <fenkes@de.ibm.com>
9  *
10  *  Copyright (c) 2005 IBM Corporation
11  *
12  *  All rights reserved.
13  *
14  *  This source code is distributed under a dual license of GPL v2.0 and OpenIB
15  *  BSD.
16  *
17  * OpenIB BSD License
18  *
19  * Redistribution and use in source and binary forms, with or without
20  * modification, are permitted provided that the following conditions are met:
21  *
22  * Redistributions of source code must retain the above copyright notice, this
23  * list of conditions and the following disclaimer.
24  *
25  * Redistributions in binary form must reproduce the above copyright notice,
26  * this list of conditions and the following disclaimer in the documentation
27  * and/or other materials
28  * provided with the distribution.
29  *
30  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
31  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
32  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
33  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
34  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
35  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
36  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
37  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
38  * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
39  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
40  * POSSIBILITY OF SUCH DAMAGE.
41  */
42
43 #ifdef CONFIG_PPC_64K_PAGES
44 #include <linux/slab.h>
45 #endif
46 #include "ehca_classes.h"
47 #include "ehca_iverbs.h"
48 #include "ehca_mrmw.h"
49 #include "ehca_tools.h"
50 #include "hcp_if.h"
51
/* Module metadata. */
MODULE_LICENSE("Dual BSD/GPL");
MODULE_AUTHOR("Christoph Raisch <raisch@de.ibm.com>");
MODULE_DESCRIPTION("IBM eServer HCA InfiniBand Device Driver");
MODULE_VERSION("SVNEHCA_0023");

/*
 * Driver-wide tunables. Each one is exposed as a module parameter below
 * (without the "ehca_" prefix); the values given here are the defaults.
 *
 * Uses visible in this file:
 *   ehca_open_aqp1   - when 1, ehca_probe() creates AQP1 for the ports
 *   ehca_debug_level - also writable at runtime via the driver's
 *                      debug_level sysfs attribute
 *   ehca_hw_level    - 0 lets ehca_sense_attributes() derive the level
 *                      from the firmware-reported hardware version
 *   ehca_nr_ports    - when 1, only one port is used/reported
 *   ehca_mr_largepage - reported through the mr_largepage device attribute
 * The remaining tunables are consumed outside this part of the file.
 */
int ehca_open_aqp1     = 0;
int ehca_debug_level   = 0;
int ehca_hw_level      = 0;
int ehca_nr_ports      = 2;
int ehca_use_hp_mr     = 0;
int ehca_port_act_time = 30;
int ehca_poll_all_eqs  = 1;
int ehca_static_rate   = -1;
int ehca_scaling_code  = 0;
int ehca_mr_largepage  = 0;

/* All parameters are registered with S_IRUGO permissions. */
module_param_named(open_aqp1,     ehca_open_aqp1,     int, S_IRUGO);
module_param_named(debug_level,   ehca_debug_level,   int, S_IRUGO);
module_param_named(hw_level,      ehca_hw_level,      int, S_IRUGO);
module_param_named(nr_ports,      ehca_nr_ports,      int, S_IRUGO);
module_param_named(use_hp_mr,     ehca_use_hp_mr,     int, S_IRUGO);
module_param_named(port_act_time, ehca_port_act_time, int, S_IRUGO);
module_param_named(poll_all_eqs,  ehca_poll_all_eqs,  int, S_IRUGO);
module_param_named(static_rate,   ehca_static_rate,   int, S_IRUGO);
module_param_named(scaling_code,  ehca_scaling_code,  int, S_IRUGO);
module_param_named(mr_largepage,  ehca_mr_largepage,  int, S_IRUGO);
78
79 MODULE_PARM_DESC(open_aqp1,
80                  "AQP1 on startup (0: no (default), 1: yes)");
81 MODULE_PARM_DESC(debug_level,
82                  "debug level"
83                  " (0: no debug traces (default), 1: with debug traces)");
84 MODULE_PARM_DESC(hw_level,
85                  "hardware level"
86                  " (0: autosensing (default), 1: v. 0.20, 2: v. 0.21)");
87 MODULE_PARM_DESC(nr_ports,
88                  "number of connected ports (default: 2)");
89 MODULE_PARM_DESC(use_hp_mr,
90                  "high performance MRs (0: no (default), 1: yes)");
91 MODULE_PARM_DESC(port_act_time,
92                  "time to wait for port activation (default: 30 sec)");
93 MODULE_PARM_DESC(poll_all_eqs,
94                  "polls all event queues periodically"
95                  " (0: no, 1: yes (default))");
96 MODULE_PARM_DESC(static_rate,
97                  "set permanent static rate (default: disabled)");
98 MODULE_PARM_DESC(scaling_code,
99                  "set scaling code (0: disabled/default, 1: enabled)");
100 MODULE_PARM_DESC(mr_largepage,
101                  "use large page for MR (0: use PAGE_SIZE (default), "
102                  "1: use large page depending on MR size");
103
/*
 * Global idr tables for QPs and CQs with one rwlock each.
 * NOTE(review): the lookups/insertions happen outside this part of the
 * file; presumably each lock guards the idr of the same name - confirm.
 */
DEFINE_RWLOCK(ehca_qp_idr_lock);
DEFINE_RWLOCK(ehca_cq_idr_lock);
DEFINE_IDR(ehca_qp_idr);
DEFINE_IDR(ehca_cq_idr);

/* ehca_probe() adds every successfully probed adapter under shca_list_lock. */
static LIST_HEAD(shca_list); /* list of all registered ehcas */
static DEFINE_SPINLOCK(shca_list_lock);

/* NOTE(review): armed elsewhere; presumably tied to poll_all_eqs - confirm. */
static struct timer_list poll_eqs_timer;

#ifdef CONFIG_PPC_64K_PAGES
/*
 * Slab cache of EHCA_PAGESIZE-sized firmware control blocks; created in
 * ehca_create_slab_caches() and only built with 64K kernel pages.
 */
static struct kmem_cache *ctblk_cache;
116
117 void *ehca_alloc_fw_ctrlblock(gfp_t flags)
118 {
119         void *ret = kmem_cache_zalloc(ctblk_cache, flags);
120         if (!ret)
121                 ehca_gen_err("Out of memory for ctblk");
122         return ret;
123 }
124
125 void ehca_free_fw_ctrlblock(void *ptr)
126 {
127         if (ptr)
128                 kmem_cache_free(ctblk_cache, ptr);
129
130 }
131 #endif
132
133 int ehca2ib_return_code(u64 ehca_rc)
134 {
135         switch (ehca_rc) {
136         case H_SUCCESS:
137                 return 0;
138         case H_RESOURCE:             /* Resource in use */
139         case H_BUSY:
140                 return -EBUSY;
141         case H_NOT_ENOUGH_RESOURCES: /* insufficient resources */
142         case H_CONSTRAINED:          /* resource constraint */
143         case H_NO_MEM:
144                 return -ENOMEM;
145         default:
146                 return -EINVAL;
147         }
148 }
149
/*
 * Create every slab cache the driver needs (PD, CQ, QP, AV, MR/MW, small
 * queues and - with 64K kernel pages - firmware control blocks).
 *
 * Returns 0 on success. On failure all caches created so far are torn
 * down again in reverse order and a negative errno is returned.
 */
static int ehca_create_slab_caches(void)
{
        int ret;

        ret = ehca_init_pd_cache();
        if (ret) {
                ehca_gen_err("Cannot create PD SLAB cache.");
                return ret;
        }

        ret = ehca_init_cq_cache();
        if (ret) {
                ehca_gen_err("Cannot create CQ SLAB cache.");
                goto create_slab_caches2;
        }

        ret = ehca_init_qp_cache();
        if (ret) {
                ehca_gen_err("Cannot create QP SLAB cache.");
                goto create_slab_caches3;
        }

        ret = ehca_init_av_cache();
        if (ret) {
                ehca_gen_err("Cannot create AV SLAB cache.");
                goto create_slab_caches4;
        }

        ret = ehca_init_mrmw_cache();
        if (ret) {
                ehca_gen_err("Cannot create MR&MW SLAB cache.");
                goto create_slab_caches5;
        }

        ret = ehca_init_small_qp_cache();
        if (ret) {
                ehca_gen_err("Cannot create small queue SLAB cache.");
                goto create_slab_caches6;
        }

#ifdef CONFIG_PPC_64K_PAGES
        ctblk_cache = kmem_cache_create("ehca_cache_ctblk",
                                        EHCA_PAGESIZE, H_CB_ALIGNMENT,
                                        SLAB_HWCACHE_ALIGN,
                                        NULL);
        if (!ctblk_cache) {
                ehca_gen_err("Cannot create ctblk SLAB cache.");
                ehca_cleanup_small_qp_cache();
                /*
                 * ret still holds 0 from the last successful init call;
                 * without this the caller would be told that everything
                 * succeeded although all caches have just been destroyed.
                 */
                ret = -ENOMEM;
                goto create_slab_caches6;
        }
#endif
        return 0;

create_slab_caches6:
        ehca_cleanup_mrmw_cache();

create_slab_caches5:
        ehca_cleanup_av_cache();

create_slab_caches4:
        ehca_cleanup_qp_cache();

create_slab_caches3:
        ehca_cleanup_cq_cache();

create_slab_caches2:
        ehca_cleanup_pd_cache();

        return ret;
}
220
/*
 * Tear down the slab caches set up by ehca_create_slab_caches(): the
 * per-object caches in reverse creation order, then the control block
 * cache (64K pages only) if it exists.
 */
static void ehca_destroy_slab_caches(void)
{
        /* per-object caches, newest first */
        ehca_cleanup_small_qp_cache();
        ehca_cleanup_mrmw_cache();
        ehca_cleanup_av_cache();
        ehca_cleanup_qp_cache();
        ehca_cleanup_cq_cache();
        ehca_cleanup_pd_cache();

#ifdef CONFIG_PPC_64K_PAGES
        if (ctblk_cache != NULL) {
                kmem_cache_destroy(ctblk_cache);
        }
#endif
}
234
235 #define EHCA_HCAAVER  EHCA_BMASK_IBM(32, 39)
236 #define EHCA_REVID    EHCA_BMASK_IBM(40, 63)
237
238 static struct cap_descr {
239         u64 mask;
240         char *descr;
241 } hca_cap_descr[] = {
242         { HCA_CAP_AH_PORT_NR_CHECK, "HCA_CAP_AH_PORT_NR_CHECK" },
243         { HCA_CAP_ATOMIC, "HCA_CAP_ATOMIC" },
244         { HCA_CAP_AUTO_PATH_MIG, "HCA_CAP_AUTO_PATH_MIG" },
245         { HCA_CAP_BAD_P_KEY_CTR, "HCA_CAP_BAD_P_KEY_CTR" },
246         { HCA_CAP_SQD_RTS_PORT_CHANGE, "HCA_CAP_SQD_RTS_PORT_CHANGE" },
247         { HCA_CAP_CUR_QP_STATE_MOD, "HCA_CAP_CUR_QP_STATE_MOD" },
248         { HCA_CAP_INIT_TYPE, "HCA_CAP_INIT_TYPE" },
249         { HCA_CAP_PORT_ACTIVE_EVENT, "HCA_CAP_PORT_ACTIVE_EVENT" },
250         { HCA_CAP_Q_KEY_VIOL_CTR, "HCA_CAP_Q_KEY_VIOL_CTR" },
251         { HCA_CAP_WQE_RESIZE, "HCA_CAP_WQE_RESIZE" },
252         { HCA_CAP_RAW_PACKET_MCAST, "HCA_CAP_RAW_PACKET_MCAST" },
253         { HCA_CAP_SHUTDOWN_PORT, "HCA_CAP_SHUTDOWN_PORT" },
254         { HCA_CAP_RC_LL_QP, "HCA_CAP_RC_LL_QP" },
255         { HCA_CAP_SRQ, "HCA_CAP_SRQ" },
256         { HCA_CAP_UD_LL_QP, "HCA_CAP_UD_LL_QP" },
257         { HCA_CAP_RESIZE_MR, "HCA_CAP_RESIZE_MR" },
258         { HCA_CAP_MINI_QP, "HCA_CAP_MINI_QP" },
259 };
260
261 int ehca_sense_attributes(struct ehca_shca *shca)
262 {
263         int i, ret = 0;
264         u64 h_ret;
265         struct hipz_query_hca *rblock;
266         struct hipz_query_port *port;
267
268         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
269         if (!rblock) {
270                 ehca_gen_err("Cannot allocate rblock memory.");
271                 return -ENOMEM;
272         }
273
274         h_ret = hipz_h_query_hca(shca->ipz_hca_handle, rblock);
275         if (h_ret != H_SUCCESS) {
276                 ehca_gen_err("Cannot query device properties. h_ret=%lx",
277                              h_ret);
278                 ret = -EPERM;
279                 goto sense_attributes1;
280         }
281
282         if (ehca_nr_ports == 1)
283                 shca->num_ports = 1;
284         else
285                 shca->num_ports = (u8)rblock->num_ports;
286
287         ehca_gen_dbg(" ... found %x ports", rblock->num_ports);
288
289         if (ehca_hw_level == 0) {
290                 u32 hcaaver;
291                 u32 revid;
292
293                 hcaaver = EHCA_BMASK_GET(EHCA_HCAAVER, rblock->hw_ver);
294                 revid   = EHCA_BMASK_GET(EHCA_REVID, rblock->hw_ver);
295
296                 ehca_gen_dbg(" ... hardware version=%x:%x", hcaaver, revid);
297
298                 if (hcaaver == 1) {
299                         if (revid <= 3)
300                                 shca->hw_level = 0x10 | (revid + 1);
301                         else
302                                 shca->hw_level = 0x14;
303                 } else if (hcaaver == 2) {
304                         if (revid == 0)
305                                 shca->hw_level = 0x21;
306                         else if (revid == 0x10)
307                                 shca->hw_level = 0x22;
308                         else if (revid == 0x20 || revid == 0x21)
309                                 shca->hw_level = 0x23;
310                 }
311
312                 if (!shca->hw_level) {
313                         ehca_gen_warn("unknown hardware version"
314                                       " - assuming default level");
315                         shca->hw_level = 0x22;
316                 }
317         } else
318                 shca->hw_level = ehca_hw_level;
319         ehca_gen_dbg(" ... hardware level=%x", shca->hw_level);
320
321         shca->sport[0].rate = IB_RATE_30_GBPS;
322         shca->sport[1].rate = IB_RATE_30_GBPS;
323
324         shca->hca_cap = rblock->hca_cap_indicators;
325         ehca_gen_dbg(" ... HCA capabilities:");
326         for (i = 0; i < ARRAY_SIZE(hca_cap_descr); i++)
327                 if (EHCA_BMASK_GET(hca_cap_descr[i].mask, shca->hca_cap))
328                         ehca_gen_dbg("   %s", hca_cap_descr[i].descr);
329
330         shca->hca_cap_mr_pgsize = rblock->memory_page_size_supported;
331
332         port = (struct hipz_query_port *)rblock;
333         h_ret = hipz_h_query_port(shca->ipz_hca_handle, 1, port);
334         if (h_ret != H_SUCCESS) {
335                 ehca_gen_err("Cannot query port properties. h_ret=%lx",
336                              h_ret);
337                 ret = -EPERM;
338                 goto sense_attributes1;
339         }
340
341         shca->max_mtu = port->max_mtu;
342
343 sense_attributes1:
344         ehca_free_fw_ctrlblock(rblock);
345         return ret;
346 }
347
348 static int init_node_guid(struct ehca_shca *shca)
349 {
350         int ret = 0;
351         struct hipz_query_hca *rblock;
352
353         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
354         if (!rblock) {
355                 ehca_err(&shca->ib_device, "Can't allocate rblock memory.");
356                 return -ENOMEM;
357         }
358
359         if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) {
360                 ehca_err(&shca->ib_device, "Can't query device properties");
361                 ret = -EINVAL;
362                 goto init_node_guid1;
363         }
364
365         memcpy(&shca->ib_device.node_guid, &rblock->node_guid, sizeof(u64));
366
367 init_node_guid1:
368         ehca_free_fw_ctrlblock(rblock);
369         return ret;
370 }
371
372 int ehca_init_device(struct ehca_shca *shca)
373 {
374         int ret;
375
376         ret = init_node_guid(shca);
377         if (ret)
378                 return ret;
379
380         strlcpy(shca->ib_device.name, "ehca%d", IB_DEVICE_NAME_MAX);
381         shca->ib_device.owner               = THIS_MODULE;
382
383         shca->ib_device.uverbs_abi_ver      = 8;
384         shca->ib_device.uverbs_cmd_mask     =
385                 (1ull << IB_USER_VERBS_CMD_GET_CONTEXT)         |
386                 (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE)        |
387                 (1ull << IB_USER_VERBS_CMD_QUERY_PORT)          |
388                 (1ull << IB_USER_VERBS_CMD_ALLOC_PD)            |
389                 (1ull << IB_USER_VERBS_CMD_DEALLOC_PD)          |
390                 (1ull << IB_USER_VERBS_CMD_REG_MR)              |
391                 (1ull << IB_USER_VERBS_CMD_DEREG_MR)            |
392                 (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
393                 (1ull << IB_USER_VERBS_CMD_CREATE_CQ)           |
394                 (1ull << IB_USER_VERBS_CMD_DESTROY_CQ)          |
395                 (1ull << IB_USER_VERBS_CMD_CREATE_QP)           |
396                 (1ull << IB_USER_VERBS_CMD_MODIFY_QP)           |
397                 (1ull << IB_USER_VERBS_CMD_QUERY_QP)            |
398                 (1ull << IB_USER_VERBS_CMD_DESTROY_QP)          |
399                 (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST)        |
400                 (1ull << IB_USER_VERBS_CMD_DETACH_MCAST);
401
402         shca->ib_device.node_type           = RDMA_NODE_IB_CA;
403         shca->ib_device.phys_port_cnt       = shca->num_ports;
404         shca->ib_device.num_comp_vectors    = 1;
405         shca->ib_device.dma_device          = &shca->ibmebus_dev->ofdev.dev;
406         shca->ib_device.query_device        = ehca_query_device;
407         shca->ib_device.query_port          = ehca_query_port;
408         shca->ib_device.query_gid           = ehca_query_gid;
409         shca->ib_device.query_pkey          = ehca_query_pkey;
410         /* shca->in_device.modify_device    = ehca_modify_device    */
411         shca->ib_device.modify_port         = ehca_modify_port;
412         shca->ib_device.alloc_ucontext      = ehca_alloc_ucontext;
413         shca->ib_device.dealloc_ucontext    = ehca_dealloc_ucontext;
414         shca->ib_device.alloc_pd            = ehca_alloc_pd;
415         shca->ib_device.dealloc_pd          = ehca_dealloc_pd;
416         shca->ib_device.create_ah           = ehca_create_ah;
417         /* shca->ib_device.modify_ah        = ehca_modify_ah;       */
418         shca->ib_device.query_ah            = ehca_query_ah;
419         shca->ib_device.destroy_ah          = ehca_destroy_ah;
420         shca->ib_device.create_qp           = ehca_create_qp;
421         shca->ib_device.modify_qp           = ehca_modify_qp;
422         shca->ib_device.query_qp            = ehca_query_qp;
423         shca->ib_device.destroy_qp          = ehca_destroy_qp;
424         shca->ib_device.post_send           = ehca_post_send;
425         shca->ib_device.post_recv           = ehca_post_recv;
426         shca->ib_device.create_cq           = ehca_create_cq;
427         shca->ib_device.destroy_cq          = ehca_destroy_cq;
428         shca->ib_device.resize_cq           = ehca_resize_cq;
429         shca->ib_device.poll_cq             = ehca_poll_cq;
430         /* shca->ib_device.peek_cq          = ehca_peek_cq;         */
431         shca->ib_device.req_notify_cq       = ehca_req_notify_cq;
432         /* shca->ib_device.req_ncomp_notif  = ehca_req_ncomp_notif; */
433         shca->ib_device.get_dma_mr          = ehca_get_dma_mr;
434         shca->ib_device.reg_phys_mr         = ehca_reg_phys_mr;
435         shca->ib_device.reg_user_mr         = ehca_reg_user_mr;
436         shca->ib_device.query_mr            = ehca_query_mr;
437         shca->ib_device.dereg_mr            = ehca_dereg_mr;
438         shca->ib_device.rereg_phys_mr       = ehca_rereg_phys_mr;
439         shca->ib_device.alloc_mw            = ehca_alloc_mw;
440         shca->ib_device.bind_mw             = ehca_bind_mw;
441         shca->ib_device.dealloc_mw          = ehca_dealloc_mw;
442         shca->ib_device.alloc_fmr           = ehca_alloc_fmr;
443         shca->ib_device.map_phys_fmr        = ehca_map_phys_fmr;
444         shca->ib_device.unmap_fmr           = ehca_unmap_fmr;
445         shca->ib_device.dealloc_fmr         = ehca_dealloc_fmr;
446         shca->ib_device.attach_mcast        = ehca_attach_mcast;
447         shca->ib_device.detach_mcast        = ehca_detach_mcast;
448         /* shca->ib_device.process_mad      = ehca_process_mad;     */
449         shca->ib_device.mmap                = ehca_mmap;
450
451         if (EHCA_BMASK_GET(HCA_CAP_SRQ, shca->hca_cap)) {
452                 shca->ib_device.uverbs_cmd_mask |=
453                         (1ull << IB_USER_VERBS_CMD_CREATE_SRQ) |
454                         (1ull << IB_USER_VERBS_CMD_MODIFY_SRQ) |
455                         (1ull << IB_USER_VERBS_CMD_QUERY_SRQ) |
456                         (1ull << IB_USER_VERBS_CMD_DESTROY_SRQ);
457
458                 shca->ib_device.create_srq          = ehca_create_srq;
459                 shca->ib_device.modify_srq          = ehca_modify_srq;
460                 shca->ib_device.query_srq           = ehca_query_srq;
461                 shca->ib_device.destroy_srq         = ehca_destroy_srq;
462                 shca->ib_device.post_srq_recv       = ehca_post_srq_recv;
463         }
464
465         return ret;
466 }
467
468 static int ehca_create_aqp1(struct ehca_shca *shca, u32 port)
469 {
470         struct ehca_sport *sport = &shca->sport[port - 1];
471         struct ib_cq *ibcq;
472         struct ib_qp *ibqp;
473         struct ib_qp_init_attr qp_init_attr;
474         int ret;
475
476         if (sport->ibcq_aqp1) {
477                 ehca_err(&shca->ib_device, "AQP1 CQ is already created.");
478                 return -EPERM;
479         }
480
481         ibcq = ib_create_cq(&shca->ib_device, NULL, NULL, (void *)(-1), 10, 0);
482         if (IS_ERR(ibcq)) {
483                 ehca_err(&shca->ib_device, "Cannot create AQP1 CQ.");
484                 return PTR_ERR(ibcq);
485         }
486         sport->ibcq_aqp1 = ibcq;
487
488         if (sport->ibqp_aqp1) {
489                 ehca_err(&shca->ib_device, "AQP1 QP is already created.");
490                 ret = -EPERM;
491                 goto create_aqp1;
492         }
493
494         memset(&qp_init_attr, 0, sizeof(struct ib_qp_init_attr));
495         qp_init_attr.send_cq          = ibcq;
496         qp_init_attr.recv_cq          = ibcq;
497         qp_init_attr.sq_sig_type      = IB_SIGNAL_ALL_WR;
498         qp_init_attr.cap.max_send_wr  = 100;
499         qp_init_attr.cap.max_recv_wr  = 100;
500         qp_init_attr.cap.max_send_sge = 2;
501         qp_init_attr.cap.max_recv_sge = 1;
502         qp_init_attr.qp_type          = IB_QPT_GSI;
503         qp_init_attr.port_num         = port;
504         qp_init_attr.qp_context       = NULL;
505         qp_init_attr.event_handler    = NULL;
506         qp_init_attr.srq              = NULL;
507
508         ibqp = ib_create_qp(&shca->pd->ib_pd, &qp_init_attr);
509         if (IS_ERR(ibqp)) {
510                 ehca_err(&shca->ib_device, "Cannot create AQP1 QP.");
511                 ret = PTR_ERR(ibqp);
512                 goto create_aqp1;
513         }
514         sport->ibqp_aqp1 = ibqp;
515
516         return 0;
517
518 create_aqp1:
519         ib_destroy_cq(sport->ibcq_aqp1);
520         return ret;
521 }
522
523 static int ehca_destroy_aqp1(struct ehca_sport *sport)
524 {
525         int ret;
526
527         ret = ib_destroy_qp(sport->ibqp_aqp1);
528         if (ret) {
529                 ehca_gen_err("Cannot destroy AQP1 QP. ret=%x", ret);
530                 return ret;
531         }
532
533         ret = ib_destroy_cq(sport->ibcq_aqp1);
534         if (ret)
535                 ehca_gen_err("Cannot destroy AQP1 CQ. ret=%x", ret);
536
537         return ret;
538 }
539
540 static ssize_t ehca_show_debug_level(struct device_driver *ddp, char *buf)
541 {
542         return snprintf(buf, PAGE_SIZE, "%d\n",
543                         ehca_debug_level);
544 }
545
546 static ssize_t ehca_store_debug_level(struct device_driver *ddp,
547                                       const char *buf, size_t count)
548 {
549         int value = (*buf) - '0';
550         if (value >= 0 && value <= 9)
551                 ehca_debug_level = value;
552         return 1;
553 }
554
/* Driver-level debug_level attribute: readable and writable by the owner. */
DRIVER_ATTR(debug_level, S_IRUSR | S_IWUSR,
            ehca_show_debug_level, ehca_store_debug_level);

/* NULL-terminated list of driver attributes. */
static struct attribute *ehca_drv_attrs[] = {
        &driver_attr_debug_level.attr,
        NULL
};

/* Attribute group wrapping ehca_drv_attrs; registered outside this view. */
static struct attribute_group ehca_drv_attr_grp = {
        .attrs = ehca_drv_attrs
};
566
/*
 * EHCA_RESOURCE_ATTR(name) - generate a read-only device attribute for one
 * field of struct hipz_query_hca.
 *
 * The expansion defines ehca_show_<name>() and the matching dev_attr_<name>
 * (S_IRUGO, no store handler). Every read allocates a firmware control
 * block, queries the adapter with hipz_h_query_hca() and prints the field
 * rblock-><name> as a decimal int followed by a newline.
 *
 * Special cases visible in the body:
 *  - if the control block cannot be allocated or the query fails, an error
 *    is logged and 0 is returned (an empty read);
 *  - for "num_ports" the value printed is 1 whenever the nr_ports module
 *    parameter is 1, regardless of what the firmware reports;
 *  - the field is copied into an int before printing.
 */
#define EHCA_RESOURCE_ATTR(name)                                           \
static ssize_t  ehca_show_##name(struct device *dev,                       \
                                 struct device_attribute *attr,            \
                                 char *buf)                                \
{                                                                          \
        struct ehca_shca *shca;                                            \
        struct hipz_query_hca *rblock;                                     \
        int data;                                                          \
                                                                           \
        shca = dev->driver_data;                                           \
                                                                           \
        rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);                      \
        if (!rblock) {                                                     \
                dev_err(dev, "Can't allocate rblock memory.");             \
                return 0;                                                  \
        }                                                                  \
                                                                           \
        if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) { \
                dev_err(dev, "Can't query device properties");             \
                ehca_free_fw_ctrlblock(rblock);                            \
                return 0;                                                  \
        }                                                                  \
                                                                           \
        data = rblock->name;                                               \
        ehca_free_fw_ctrlblock(rblock);                                    \
                                                                           \
        if ((strcmp(#name, "num_ports") == 0) && (ehca_nr_ports == 1))     \
                return snprintf(buf, 256, "1\n");                          \
        else                                                               \
                return snprintf(buf, 256, "%d\n", data);                   \
                                                                           \
}                                                                          \
static DEVICE_ATTR(name, S_IRUGO, ehca_show_##name, NULL);

/* One attribute per queried field; all are listed in ehca_dev_attrs[]. */
EHCA_RESOURCE_ATTR(num_ports);
EHCA_RESOURCE_ATTR(hw_ver);
EHCA_RESOURCE_ATTR(max_eq);
EHCA_RESOURCE_ATTR(cur_eq);
EHCA_RESOURCE_ATTR(max_cq);
EHCA_RESOURCE_ATTR(cur_cq);
EHCA_RESOURCE_ATTR(max_qp);
EHCA_RESOURCE_ATTR(cur_qp);
EHCA_RESOURCE_ATTR(max_mr);
EHCA_RESOURCE_ATTR(cur_mr);
EHCA_RESOURCE_ATTR(max_mw);
EHCA_RESOURCE_ATTR(cur_mw);
EHCA_RESOURCE_ATTR(max_pd);
EHCA_RESOURCE_ATTR(max_ah);
615
616 static ssize_t ehca_show_adapter_handle(struct device *dev,
617                                         struct device_attribute *attr,
618                                         char *buf)
619 {
620         struct ehca_shca *shca = dev->driver_data;
621
622         return sprintf(buf, "%lx\n", shca->ipz_hca_handle.handle);
623
624 }
625 static DEVICE_ATTR(adapter_handle, S_IRUGO, ehca_show_adapter_handle, NULL);
626
627 static ssize_t ehca_show_mr_largepage(struct device *dev,
628                                       struct device_attribute *attr,
629                                       char *buf)
630 {
631         return sprintf(buf, "%d\n", ehca_mr_largepage);
632 }
633 static DEVICE_ATTR(mr_largepage, S_IRUGO, ehca_show_mr_largepage, NULL);
634
/*
 * NULL-terminated list of the per-adapter sysfs attributes: the adapter
 * handle, the resource counters generated by EHCA_RESOURCE_ATTR() and the
 * mr_largepage setting.
 */
static struct attribute *ehca_dev_attrs[] = {
        &dev_attr_adapter_handle.attr,
        &dev_attr_num_ports.attr,
        &dev_attr_hw_ver.attr,
        &dev_attr_max_eq.attr,
        &dev_attr_cur_eq.attr,
        &dev_attr_max_cq.attr,
        &dev_attr_cur_cq.attr,
        &dev_attr_max_qp.attr,
        &dev_attr_cur_qp.attr,
        &dev_attr_max_mr.attr,
        &dev_attr_cur_mr.attr,
        &dev_attr_max_mw.attr,
        &dev_attr_cur_mw.attr,
        &dev_attr_max_pd.attr,
        &dev_attr_max_ah.attr,
        &dev_attr_mr_largepage.attr,
        NULL
};

/*
 * Group created on the adapter's device kobject in ehca_probe() and
 * removed again in ehca_remove().
 */
static struct attribute_group ehca_dev_attr_grp = {
        .attrs = ehca_dev_attrs
};
658
659 static int __devinit ehca_probe(struct ibmebus_dev *dev,
660                                 const struct of_device_id *id)
661 {
662         struct ehca_shca *shca;
663         const u64 *handle;
664         struct ib_pd *ibpd;
665         int ret;
666
667         handle = of_get_property(dev->ofdev.node, "ibm,hca-handle", NULL);
668         if (!handle) {
669                 ehca_gen_err("Cannot get eHCA handle for adapter: %s.",
670                              dev->ofdev.node->full_name);
671                 return -ENODEV;
672         }
673
674         if (!(*handle)) {
675                 ehca_gen_err("Wrong eHCA handle for adapter: %s.",
676                              dev->ofdev.node->full_name);
677                 return -ENODEV;
678         }
679
680         shca = (struct ehca_shca *)ib_alloc_device(sizeof(*shca));
681         if (!shca) {
682                 ehca_gen_err("Cannot allocate shca memory.");
683                 return -ENOMEM;
684         }
685         mutex_init(&shca->modify_mutex);
686
687         shca->ibmebus_dev = dev;
688         shca->ipz_hca_handle.handle = *handle;
689         dev->ofdev.dev.driver_data = shca;
690
691         ret = ehca_sense_attributes(shca);
692         if (ret < 0) {
693                 ehca_gen_err("Cannot sense eHCA attributes.");
694                 goto probe1;
695         }
696
697         ret = ehca_init_device(shca);
698         if (ret) {
699                 ehca_gen_err("Cannot init ehca  device struct");
700                 goto probe1;
701         }
702
703         /* create event queues */
704         ret = ehca_create_eq(shca, &shca->eq, EHCA_EQ, 2048);
705         if (ret) {
706                 ehca_err(&shca->ib_device, "Cannot create EQ.");
707                 goto probe1;
708         }
709
710         ret = ehca_create_eq(shca, &shca->neq, EHCA_NEQ, 513);
711         if (ret) {
712                 ehca_err(&shca->ib_device, "Cannot create NEQ.");
713                 goto probe3;
714         }
715
716         /* create internal protection domain */
717         ibpd = ehca_alloc_pd(&shca->ib_device, (void *)(-1), NULL);
718         if (IS_ERR(ibpd)) {
719                 ehca_err(&shca->ib_device, "Cannot create internal PD.");
720                 ret = PTR_ERR(ibpd);
721                 goto probe4;
722         }
723
724         shca->pd = container_of(ibpd, struct ehca_pd, ib_pd);
725         shca->pd->ib_pd.device = &shca->ib_device;
726
727         /* create internal max MR */
728         ret = ehca_reg_internal_maxmr(shca, shca->pd, &shca->maxmr);
729
730         if (ret) {
731                 ehca_err(&shca->ib_device, "Cannot create internal MR ret=%x",
732                          ret);
733                 goto probe5;
734         }
735
736         ret = ib_register_device(&shca->ib_device);
737         if (ret) {
738                 ehca_err(&shca->ib_device,
739                          "ib_register_device() failed ret=%x", ret);
740                 goto probe6;
741         }
742
743         /* create AQP1 for port 1 */
744         if (ehca_open_aqp1 == 1) {
745                 shca->sport[0].port_state = IB_PORT_DOWN;
746                 ret = ehca_create_aqp1(shca, 1);
747                 if (ret) {
748                         ehca_err(&shca->ib_device,
749                                  "Cannot create AQP1 for port 1.");
750                         goto probe7;
751                 }
752         }
753
754         /* create AQP1 for port 2 */
755         if ((ehca_open_aqp1 == 1) && (shca->num_ports == 2)) {
756                 shca->sport[1].port_state = IB_PORT_DOWN;
757                 ret = ehca_create_aqp1(shca, 2);
758                 if (ret) {
759                         ehca_err(&shca->ib_device,
760                                  "Cannot create AQP1 for port 2.");
761                         goto probe8;
762                 }
763         }
764
765         ret = sysfs_create_group(&dev->ofdev.dev.kobj, &ehca_dev_attr_grp);
766         if (ret) /* only complain; we can live without attributes */
767                 ehca_err(&shca->ib_device,
768                          "Cannot create device attributes  ret=%d", ret);
769
770         spin_lock(&shca_list_lock);
771         list_add(&shca->shca_list, &shca_list);
772         spin_unlock(&shca_list_lock);
773
774         return 0;
775
776 probe8:
777         ret = ehca_destroy_aqp1(&shca->sport[0]);
778         if (ret)
779                 ehca_err(&shca->ib_device,
780                          "Cannot destroy AQP1 for port 1. ret=%x", ret);
781
782 probe7:
783         ib_unregister_device(&shca->ib_device);
784
785 probe6:
786         ret = ehca_dereg_internal_maxmr(shca);
787         if (ret)
788                 ehca_err(&shca->ib_device,
789                          "Cannot destroy internal MR. ret=%x", ret);
790
791 probe5:
792         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
793         if (ret)
794                 ehca_err(&shca->ib_device,
795                          "Cannot destroy internal PD. ret=%x", ret);
796
797 probe4:
798         ret = ehca_destroy_eq(shca, &shca->neq);
799         if (ret)
800                 ehca_err(&shca->ib_device,
801                          "Cannot destroy NEQ. ret=%x", ret);
802
803 probe3:
804         ret = ehca_destroy_eq(shca, &shca->eq);
805         if (ret)
806                 ehca_err(&shca->ib_device,
807                          "Cannot destroy EQ. ret=%x", ret);
808
809 probe1:
810         ib_dealloc_device(&shca->ib_device);
811
812         return -EINVAL;
813 }
814
815 static int __devexit ehca_remove(struct ibmebus_dev *dev)
816 {
817         struct ehca_shca *shca = dev->ofdev.dev.driver_data;
818         int ret;
819
820         sysfs_remove_group(&dev->ofdev.dev.kobj, &ehca_dev_attr_grp);
821
822         if (ehca_open_aqp1 == 1) {
823                 int i;
824                 for (i = 0; i < shca->num_ports; i++) {
825                         ret = ehca_destroy_aqp1(&shca->sport[i]);
826                         if (ret)
827                                 ehca_err(&shca->ib_device,
828                                          "Cannot destroy AQP1 for port %x "
829                                          "ret=%x", ret, i);
830                 }
831         }
832
833         ib_unregister_device(&shca->ib_device);
834
835         ret = ehca_dereg_internal_maxmr(shca);
836         if (ret)
837                 ehca_err(&shca->ib_device,
838                          "Cannot destroy internal MR. ret=%x", ret);
839
840         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
841         if (ret)
842                 ehca_err(&shca->ib_device,
843                          "Cannot destroy internal PD. ret=%x", ret);
844
845         ret = ehca_destroy_eq(shca, &shca->eq);
846         if (ret)
847                 ehca_err(&shca->ib_device, "Cannot destroy EQ. ret=%x", ret);
848
849         ret = ehca_destroy_eq(shca, &shca->neq);
850         if (ret)
851                 ehca_err(&shca->ib_device, "Canot destroy NEQ. ret=%x", ret);
852
853         ib_dealloc_device(&shca->ib_device);
854
855         spin_lock(&shca_list_lock);
856         list_del(&shca->shca_list);
857         spin_unlock(&shca_list_lock);
858
859         return ret;
860 }
861
862 static struct of_device_id ehca_device_table[] =
863 {
864         {
865                 .name       = "lhca",
866                 .compatible = "IBM,lhca",
867         },
868         {},
869 };
870
871 static struct ibmebus_driver ehca_driver = {
872         .name     = "ehca",
873         .id_table = ehca_device_table,
874         .probe    = ehca_probe,
875         .remove   = ehca_remove,
876 };
877
878 void ehca_poll_eqs(unsigned long data)
879 {
880         struct ehca_shca *shca;
881
882         spin_lock(&shca_list_lock);
883         list_for_each_entry(shca, &shca_list, shca_list) {
884                 if (shca->eq.is_initialized) {
885                         /* call deadman proc only if eq ptr does not change */
886                         struct ehca_eq *eq = &shca->eq;
887                         int max = 3;
888                         volatile u64 q_ofs, q_ofs2;
889                         u64 flags;
890                         spin_lock_irqsave(&eq->spinlock, flags);
891                         q_ofs = eq->ipz_queue.current_q_offset;
892                         spin_unlock_irqrestore(&eq->spinlock, flags);
893                         do {
894                                 spin_lock_irqsave(&eq->spinlock, flags);
895                                 q_ofs2 = eq->ipz_queue.current_q_offset;
896                                 spin_unlock_irqrestore(&eq->spinlock, flags);
897                                 max--;
898                         } while (q_ofs == q_ofs2 && max > 0);
899                         if (q_ofs == q_ofs2)
900                                 ehca_process_eq(shca, 0);
901                 }
902         }
903         mod_timer(&poll_eqs_timer, jiffies + HZ);
904         spin_unlock(&shca_list_lock);
905 }
906
907 int __init ehca_module_init(void)
908 {
909         int ret;
910
911         printk(KERN_INFO "eHCA Infiniband Device Driver "
912                "(Rel.: SVNEHCA_0023)\n");
913
914         ret = ehca_create_comp_pool();
915         if (ret) {
916                 ehca_gen_err("Cannot create comp pool.");
917                 return ret;
918         }
919
920         ret = ehca_create_slab_caches();
921         if (ret) {
922                 ehca_gen_err("Cannot create SLAB caches");
923                 ret = -ENOMEM;
924                 goto module_init1;
925         }
926
927         ret = ibmebus_register_driver(&ehca_driver);
928         if (ret) {
929                 ehca_gen_err("Cannot register eHCA device driver");
930                 ret = -EINVAL;
931                 goto module_init2;
932         }
933
934         ret = sysfs_create_group(&ehca_driver.driver.kobj, &ehca_drv_attr_grp);
935         if (ret) /* only complain; we can live without attributes */
936                 ehca_gen_err("Cannot create driver attributes  ret=%d", ret);
937
938         if (ehca_poll_all_eqs != 1) {
939                 ehca_gen_err("WARNING!!!");
940                 ehca_gen_err("It is possible to lose interrupts.");
941         } else {
942                 init_timer(&poll_eqs_timer);
943                 poll_eqs_timer.function = ehca_poll_eqs;
944                 poll_eqs_timer.expires = jiffies + HZ;
945                 add_timer(&poll_eqs_timer);
946         }
947
948         return 0;
949
950 module_init2:
951         ehca_destroy_slab_caches();
952
953 module_init1:
954         ehca_destroy_comp_pool();
955         return ret;
956 };
957
958 void __exit ehca_module_exit(void)
959 {
960         if (ehca_poll_all_eqs == 1)
961                 del_timer_sync(&poll_eqs_timer);
962
963         sysfs_remove_group(&ehca_driver.driver.kobj, &ehca_drv_attr_grp);
964         ibmebus_unregister_driver(&ehca_driver);
965
966         ehca_destroy_slab_caches();
967
968         ehca_destroy_comp_pool();
969
970         idr_destroy(&ehca_cq_idr);
971         idr_destroy(&ehca_qp_idr);
972 };
973
/* Declare the functions to run when the module is loaded and unloaded. */
module_init(ehca_module_init);
module_exit(ehca_module_exit);