]> git.kernelconcepts.de Git - karo-tx-linux.git/blob - drivers/staging/rdma/ehca/ehca_main.c
Merge tag 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/dledford/rdma
[karo-tx-linux.git] / drivers / staging / rdma / ehca / ehca_main.c
1 /*
2  *  IBM eServer eHCA Infiniband device driver for Linux on POWER
3  *
4  *  module start stop, hca detection
5  *
6  *  Authors: Heiko J Schick <schickhj@de.ibm.com>
7  *           Hoang-Nam Nguyen <hnguyen@de.ibm.com>
8  *           Joachim Fenkes <fenkes@de.ibm.com>
9  *
10  *  Copyright (c) 2005 IBM Corporation
11  *
12  *  All rights reserved.
13  *
14  *  This source code is distributed under a dual license of GPL v2.0 and OpenIB
15  *  BSD.
16  *
17  * OpenIB BSD License
18  *
19  * Redistribution and use in source and binary forms, with or without
20  * modification, are permitted provided that the following conditions are met:
21  *
22  * Redistributions of source code must retain the above copyright notice, this
23  * list of conditions and the following disclaimer.
24  *
25  * Redistributions in binary form must reproduce the above copyright notice,
26  * this list of conditions and the following disclaimer in the documentation
27  * and/or other materials
28  * provided with the distribution.
29  *
30  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
31  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
32  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
33  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
34  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
35  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
36  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
37  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
38  * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
39  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
40  * POSSIBILITY OF SUCH DAMAGE.
41  */
42
43 #ifdef CONFIG_PPC_64K_PAGES
44 #include <linux/slab.h>
45 #endif
46
47 #include <linux/notifier.h>
48 #include <linux/memory.h>
49 #include <rdma/ib_mad.h>
50 #include "ehca_classes.h"
51 #include "ehca_iverbs.h"
52 #include "ehca_mrmw.h"
53 #include "ehca_tools.h"
54 #include "hcp_if.h"
55
/* Driver version string; reported through MODULE_VERSION() below. */
#define HCAD_VERSION "0029"

/* Module metadata: licence, author, description and version. */
MODULE_LICENSE("Dual BSD/GPL");
MODULE_AUTHOR("Christoph Raisch <raisch@de.ibm.com>");
MODULE_DESCRIPTION("IBM eServer HCA InfiniBand Device Driver");
MODULE_VERSION(HCAD_VERSION);
62
/*
 * Backing variables for the module parameters registered below.
 * The file-local ones are only used in this file; the non-static ones
 * have external linkage.  A value of -1 means "autodetect" for nr_ports,
 * lock_hcalls, number_of_cqs and number_of_qps, and "no static rate" for
 * static_rate (see the MODULE_PARM_DESC texts).
 */
static bool ehca_open_aqp1    = 0;
static int ehca_hw_level      = 0;
static bool ehca_poll_all_eqs = 1;

int ehca_debug_level   = 0;
int ehca_nr_ports      = -1;
bool ehca_use_hp_mr    = 0;
int ehca_port_act_time = 30;
int ehca_static_rate   = -1;
bool ehca_scaling_code = 0;
int ehca_lock_hcalls   = -1;
int ehca_max_cq        = -1;
int ehca_max_qp        = -1;

/*
 * Expose the variables above as read-only (S_IRUGO) module parameters.
 * lock_hcalls is stored in an int but registered with the "bint" type
 * so that the -1 autodetect default can be kept in the same variable.
 */
module_param_named(open_aqp1,     ehca_open_aqp1,     bool, S_IRUGO);
module_param_named(debug_level,   ehca_debug_level,   int,  S_IRUGO);
module_param_named(hw_level,      ehca_hw_level,      int,  S_IRUGO);
module_param_named(nr_ports,      ehca_nr_ports,      int,  S_IRUGO);
module_param_named(use_hp_mr,     ehca_use_hp_mr,     bool, S_IRUGO);
module_param_named(port_act_time, ehca_port_act_time, int,  S_IRUGO);
module_param_named(poll_all_eqs,  ehca_poll_all_eqs,  bool, S_IRUGO);
module_param_named(static_rate,   ehca_static_rate,   int,  S_IRUGO);
module_param_named(scaling_code,  ehca_scaling_code,  bool, S_IRUGO);
module_param_named(lock_hcalls,   ehca_lock_hcalls,   bint, S_IRUGO);
module_param_named(number_of_cqs, ehca_max_cq,        int,  S_IRUGO);
module_param_named(number_of_qps, ehca_max_qp,        int,  S_IRUGO);
89
/* Human-readable descriptions, one per module parameter of this driver. */
MODULE_PARM_DESC(open_aqp1,
                 "Open AQP1 on startup (default: no)");
MODULE_PARM_DESC(debug_level,
                 "Amount of debug output (0: none (default), 1: traces, "
                 "2: some dumps, 3: lots)");
MODULE_PARM_DESC(hw_level,
                 "Hardware level (0: autosensing (default), "
                 "0x10..0x14: eHCA, 0x20..0x23: eHCA2)");
MODULE_PARM_DESC(nr_ports,
                 "number of connected ports (-1: autodetect (default), "
                 "1: port one only, 2: two ports)");
MODULE_PARM_DESC(use_hp_mr,
                 "Use high performance MRs (default: no)");
MODULE_PARM_DESC(port_act_time,
                 "Time to wait for port activation (default: 30 sec)");
MODULE_PARM_DESC(poll_all_eqs,
                 "Poll all event queues periodically (default: yes)");
MODULE_PARM_DESC(static_rate,
                 "Set permanent static rate (default: no static rate)");
MODULE_PARM_DESC(scaling_code,
                 "Enable scaling code (default: no)");
MODULE_PARM_DESC(lock_hcalls,
                 "Serialize all hCalls made by the driver "
                 "(default: autodetect)");
MODULE_PARM_DESC(number_of_cqs,
                "Max number of CQs which can be allocated "
                "(default: autodetect)");
MODULE_PARM_DESC(number_of_qps,
                "Max number of QPs which can be allocated "
                "(default: autodetect)");
120
/*
 * Global IDR tables for QPs and CQs together with one rwlock each.
 * NOTE(review): the lookup/insert code that uses them is not in this
 * part of the file -- presumably each lock guards the IDR of the same
 * name; confirm against the users.
 */
DEFINE_RWLOCK(ehca_qp_idr_lock);
DEFINE_RWLOCK(ehca_cq_idr_lock);
DEFINE_IDR(ehca_qp_idr);
DEFINE_IDR(ehca_cq_idr);

static LIST_HEAD(shca_list); /* list of all registered ehcas */
/* NOTE(review): presumably serializes access to shca_list -- confirm. */
DEFINE_SPINLOCK(shca_list_lock);

/*
 * NOTE(review): presumably the timer behind the poll_all_eqs module
 * parameter; its setup and handler are outside this view.
 */
static struct timer_list poll_eqs_timer;
130
131 #ifdef CONFIG_PPC_64K_PAGES
/*
 * Slab cache backing ehca_alloc_fw_ctrlblock()/ehca_free_fw_ctrlblock();
 * created in ehca_create_slab_caches() with EHCA_PAGESIZE-sized objects.
 * Only built when CONFIG_PPC_64K_PAGES is set.
 */
static struct kmem_cache *ctblk_cache;
133
134 void *ehca_alloc_fw_ctrlblock(gfp_t flags)
135 {
136         void *ret = kmem_cache_zalloc(ctblk_cache, flags);
137         if (!ret)
138                 ehca_gen_err("Out of memory for ctblk");
139         return ret;
140 }
141
142 void ehca_free_fw_ctrlblock(void *ptr)
143 {
144         if (ptr)
145                 kmem_cache_free(ctblk_cache, ptr);
146
147 }
148 #endif
149
150 int ehca2ib_return_code(u64 ehca_rc)
151 {
152         switch (ehca_rc) {
153         case H_SUCCESS:
154                 return 0;
155         case H_RESOURCE:             /* Resource in use */
156         case H_BUSY:
157                 return -EBUSY;
158         case H_NOT_ENOUGH_RESOURCES: /* insufficient resources */
159         case H_CONSTRAINED:          /* resource constraint */
160         case H_NO_MEM:
161                 return -ENOMEM;
162         default:
163                 return -EINVAL;
164         }
165 }
166
/*
 * Create every slab cache the driver needs: PD, CQ, QP, AV, MR/MW and
 * small-queue caches, plus the firmware control block cache when
 * CONFIG_PPC_64K_PAGES is set.
 *
 * On failure the caches created so far are torn down again in reverse
 * order of creation.
 *
 * Returns 0 on success, the error code of the failing init function, or
 * -ENOMEM when the control block cache cannot be created.
 */
static int ehca_create_slab_caches(void)
{
        int rc;

        rc = ehca_init_pd_cache();
        if (rc) {
                ehca_gen_err("Cannot create PD SLAB cache.");
                return rc;
        }

        rc = ehca_init_cq_cache();
        if (rc) {
                ehca_gen_err("Cannot create CQ SLAB cache.");
                goto undo_pd;
        }

        rc = ehca_init_qp_cache();
        if (rc) {
                ehca_gen_err("Cannot create QP SLAB cache.");
                goto undo_cq;
        }

        rc = ehca_init_av_cache();
        if (rc) {
                ehca_gen_err("Cannot create AV SLAB cache.");
                goto undo_qp;
        }

        rc = ehca_init_mrmw_cache();
        if (rc) {
                ehca_gen_err("Cannot create MR&MW SLAB cache.");
                goto undo_av;
        }

        rc = ehca_init_small_qp_cache();
        if (rc) {
                ehca_gen_err("Cannot create small queue SLAB cache.");
                goto undo_mrmw;
        }

#ifdef CONFIG_PPC_64K_PAGES
        ctblk_cache = kmem_cache_create("ehca_cache_ctblk",
                                        EHCA_PAGESIZE, H_CB_ALIGNMENT,
                                        SLAB_HWCACHE_ALIGN,
                                        NULL);
        if (!ctblk_cache) {
                ehca_gen_err("Cannot create ctblk SLAB cache.");
                rc = -ENOMEM;
                goto undo_small_qp;
        }
#endif
        return 0;

        /* Unwind ladder: each label undoes the step named after it. */
#ifdef CONFIG_PPC_64K_PAGES
undo_small_qp:
        ehca_cleanup_small_qp_cache();
#endif

undo_mrmw:
        ehca_cleanup_mrmw_cache();

undo_av:
        ehca_cleanup_av_cache();

undo_qp:
        ehca_cleanup_qp_cache();

undo_cq:
        ehca_cleanup_cq_cache();

undo_pd:
        ehca_cleanup_pd_cache();

        return rc;
}
238
/*
 * Tear down all slab caches set up by ehca_create_slab_caches(): the
 * small-queue, MR/MW, AV, QP, CQ and PD caches, and -- when
 * CONFIG_PPC_64K_PAGES is set -- the firmware control block cache.
 */
static void ehca_destroy_slab_caches(void)
{
        ehca_cleanup_small_qp_cache();
        ehca_cleanup_mrmw_cache();
        ehca_cleanup_av_cache();
        ehca_cleanup_qp_cache();
        ehca_cleanup_cq_cache();
        ehca_cleanup_pd_cache();
#ifdef CONFIG_PPC_64K_PAGES
        kmem_cache_destroy(ctblk_cache);
#endif
}
251
/*
 * Bit fields extracted from rblock->hw_ver in ehca_sense_attributes():
 * EHCA_HCAAVER covers bits 32..39 and EHCA_REVID bits 40..63 as given to
 * EHCA_BMASK_IBM().
 */
#define EHCA_HCAAVER  EHCA_BMASK_IBM(32, 39)
#define EHCA_REVID    EHCA_BMASK_IBM(40, 63)
254
255 static struct cap_descr {
256         u64 mask;
257         char *descr;
258 } hca_cap_descr[] = {
259         { HCA_CAP_AH_PORT_NR_CHECK, "HCA_CAP_AH_PORT_NR_CHECK" },
260         { HCA_CAP_ATOMIC, "HCA_CAP_ATOMIC" },
261         { HCA_CAP_AUTO_PATH_MIG, "HCA_CAP_AUTO_PATH_MIG" },
262         { HCA_CAP_BAD_P_KEY_CTR, "HCA_CAP_BAD_P_KEY_CTR" },
263         { HCA_CAP_SQD_RTS_PORT_CHANGE, "HCA_CAP_SQD_RTS_PORT_CHANGE" },
264         { HCA_CAP_CUR_QP_STATE_MOD, "HCA_CAP_CUR_QP_STATE_MOD" },
265         { HCA_CAP_INIT_TYPE, "HCA_CAP_INIT_TYPE" },
266         { HCA_CAP_PORT_ACTIVE_EVENT, "HCA_CAP_PORT_ACTIVE_EVENT" },
267         { HCA_CAP_Q_KEY_VIOL_CTR, "HCA_CAP_Q_KEY_VIOL_CTR" },
268         { HCA_CAP_WQE_RESIZE, "HCA_CAP_WQE_RESIZE" },
269         { HCA_CAP_RAW_PACKET_MCAST, "HCA_CAP_RAW_PACKET_MCAST" },
270         { HCA_CAP_SHUTDOWN_PORT, "HCA_CAP_SHUTDOWN_PORT" },
271         { HCA_CAP_RC_LL_QP, "HCA_CAP_RC_LL_QP" },
272         { HCA_CAP_SRQ, "HCA_CAP_SRQ" },
273         { HCA_CAP_UD_LL_QP, "HCA_CAP_UD_LL_QP" },
274         { HCA_CAP_RESIZE_MR, "HCA_CAP_RESIZE_MR" },
275         { HCA_CAP_MINI_QP, "HCA_CAP_MINI_QP" },
276         { HCA_CAP_H_ALLOC_RES_SYNC, "HCA_CAP_H_ALLOC_RES_SYNC" },
277 };
278
279 static int ehca_sense_attributes(struct ehca_shca *shca)
280 {
281         int i, ret = 0;
282         u64 h_ret;
283         struct hipz_query_hca *rblock;
284         struct hipz_query_port *port;
285         const char *loc_code;
286
287         static const u32 pgsize_map[] = {
288                 HCA_CAP_MR_PGSIZE_4K,  0x1000,
289                 HCA_CAP_MR_PGSIZE_64K, 0x10000,
290                 HCA_CAP_MR_PGSIZE_1M,  0x100000,
291                 HCA_CAP_MR_PGSIZE_16M, 0x1000000,
292         };
293
294         ehca_gen_dbg("Probing adapter %s...",
295                      shca->ofdev->dev.of_node->full_name);
296         loc_code = of_get_property(shca->ofdev->dev.of_node, "ibm,loc-code",
297                                    NULL);
298         if (loc_code)
299                 ehca_gen_dbg(" ... location lode=%s", loc_code);
300
301         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
302         if (!rblock) {
303                 ehca_gen_err("Cannot allocate rblock memory.");
304                 return -ENOMEM;
305         }
306
307         h_ret = hipz_h_query_hca(shca->ipz_hca_handle, rblock);
308         if (h_ret != H_SUCCESS) {
309                 ehca_gen_err("Cannot query device properties. h_ret=%lli",
310                              h_ret);
311                 ret = -EPERM;
312                 goto sense_attributes1;
313         }
314
315         if (ehca_nr_ports == 1)
316                 shca->num_ports = 1;
317         else
318                 shca->num_ports = (u8)rblock->num_ports;
319
320         ehca_gen_dbg(" ... found %x ports", rblock->num_ports);
321
322         if (ehca_hw_level == 0) {
323                 u32 hcaaver;
324                 u32 revid;
325
326                 hcaaver = EHCA_BMASK_GET(EHCA_HCAAVER, rblock->hw_ver);
327                 revid   = EHCA_BMASK_GET(EHCA_REVID, rblock->hw_ver);
328
329                 ehca_gen_dbg(" ... hardware version=%x:%x", hcaaver, revid);
330
331                 if (hcaaver == 1) {
332                         if (revid <= 3)
333                                 shca->hw_level = 0x10 | (revid + 1);
334                         else
335                                 shca->hw_level = 0x14;
336                 } else if (hcaaver == 2) {
337                         if (revid == 0)
338                                 shca->hw_level = 0x21;
339                         else if (revid == 0x10)
340                                 shca->hw_level = 0x22;
341                         else if (revid == 0x20 || revid == 0x21)
342                                 shca->hw_level = 0x23;
343                 }
344
345                 if (!shca->hw_level) {
346                         ehca_gen_warn("unknown hardware version"
347                                       " - assuming default level");
348                         shca->hw_level = 0x22;
349                 }
350         } else
351                 shca->hw_level = ehca_hw_level;
352         ehca_gen_dbg(" ... hardware level=%x", shca->hw_level);
353
354         shca->hca_cap = rblock->hca_cap_indicators;
355         ehca_gen_dbg(" ... HCA capabilities:");
356         for (i = 0; i < ARRAY_SIZE(hca_cap_descr); i++)
357                 if (EHCA_BMASK_GET(hca_cap_descr[i].mask, shca->hca_cap))
358                         ehca_gen_dbg("   %s", hca_cap_descr[i].descr);
359
360         /* Autodetect hCall locking -- the "H_ALLOC_RESOURCE synced" flag is
361          * a firmware property, so it's valid across all adapters
362          */
363         if (ehca_lock_hcalls == -1)
364                 ehca_lock_hcalls = !EHCA_BMASK_GET(HCA_CAP_H_ALLOC_RES_SYNC,
365                                         shca->hca_cap);
366
367         /* translate supported MR page sizes; always support 4K */
368         shca->hca_cap_mr_pgsize = EHCA_PAGESIZE;
369         for (i = 0; i < ARRAY_SIZE(pgsize_map); i += 2)
370                 if (rblock->memory_page_size_supported & pgsize_map[i])
371                         shca->hca_cap_mr_pgsize |= pgsize_map[i + 1];
372
373         /* Set maximum number of CQs and QPs to calculate EQ size */
374         if (shca->max_num_qps == -1)
375                 shca->max_num_qps = min_t(int, rblock->max_qp,
376                                           EHCA_MAX_NUM_QUEUES);
377         else if (shca->max_num_qps < 1 || shca->max_num_qps > rblock->max_qp) {
378                 ehca_gen_warn("The requested number of QPs is out of range "
379                               "(1 - %i) specified by HW. Value is set to %i",
380                               rblock->max_qp, rblock->max_qp);
381                 shca->max_num_qps = rblock->max_qp;
382         }
383
384         if (shca->max_num_cqs == -1)
385                 shca->max_num_cqs = min_t(int, rblock->max_cq,
386                                           EHCA_MAX_NUM_QUEUES);
387         else if (shca->max_num_cqs < 1 || shca->max_num_cqs > rblock->max_cq) {
388                 ehca_gen_warn("The requested number of CQs is out of range "
389                               "(1 - %i) specified by HW. Value is set to %i",
390                               rblock->max_cq, rblock->max_cq);
391         }
392
393         /* query max MTU from first port -- it's the same for all ports */
394         port = (struct hipz_query_port *)rblock;
395         h_ret = hipz_h_query_port(shca->ipz_hca_handle, 1, port);
396         if (h_ret != H_SUCCESS) {
397                 ehca_gen_err("Cannot query port properties. h_ret=%lli",
398                              h_ret);
399                 ret = -EPERM;
400                 goto sense_attributes1;
401         }
402
403         shca->max_mtu = port->max_mtu;
404
405 sense_attributes1:
406         ehca_free_fw_ctrlblock(rblock);
407         return ret;
408 }
409
410 static int init_node_guid(struct ehca_shca *shca)
411 {
412         int ret = 0;
413         struct hipz_query_hca *rblock;
414
415         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
416         if (!rblock) {
417                 ehca_err(&shca->ib_device, "Can't allocate rblock memory.");
418                 return -ENOMEM;
419         }
420
421         if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) {
422                 ehca_err(&shca->ib_device, "Can't query device properties");
423                 ret = -EINVAL;
424                 goto init_node_guid1;
425         }
426
427         memcpy(&shca->ib_device.node_guid, &rblock->node_guid, sizeof(u64));
428
429 init_node_guid1:
430         ehca_free_fw_ctrlblock(rblock);
431         return ret;
432 }
433
434 static int ehca_port_immutable(struct ib_device *ibdev, u8 port_num,
435                                struct ib_port_immutable *immutable)
436 {
437         struct ib_port_attr attr;
438         int err;
439
440         err = ehca_query_port(ibdev, port_num, &attr);
441         if (err)
442                 return err;
443
444         immutable->pkey_tbl_len = attr.pkey_tbl_len;
445         immutable->gid_tbl_len = attr.gid_tbl_len;
446         immutable->core_cap_flags = RDMA_CORE_PORT_IBA_IB;
447         immutable->max_mad_size = IB_MGMT_MAD_SIZE;
448
449         return 0;
450 }
451
452 static int ehca_init_device(struct ehca_shca *shca)
453 {
454         int ret;
455
456         ret = init_node_guid(shca);
457         if (ret)
458                 return ret;
459
460         strlcpy(shca->ib_device.name, "ehca%d", IB_DEVICE_NAME_MAX);
461         shca->ib_device.owner               = THIS_MODULE;
462
463         shca->ib_device.uverbs_abi_ver      = 8;
464         shca->ib_device.uverbs_cmd_mask     =
465                 (1ull << IB_USER_VERBS_CMD_GET_CONTEXT)         |
466                 (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE)        |
467                 (1ull << IB_USER_VERBS_CMD_QUERY_PORT)          |
468                 (1ull << IB_USER_VERBS_CMD_ALLOC_PD)            |
469                 (1ull << IB_USER_VERBS_CMD_DEALLOC_PD)          |
470                 (1ull << IB_USER_VERBS_CMD_REG_MR)              |
471                 (1ull << IB_USER_VERBS_CMD_DEREG_MR)            |
472                 (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
473                 (1ull << IB_USER_VERBS_CMD_CREATE_CQ)           |
474                 (1ull << IB_USER_VERBS_CMD_DESTROY_CQ)          |
475                 (1ull << IB_USER_VERBS_CMD_CREATE_QP)           |
476                 (1ull << IB_USER_VERBS_CMD_MODIFY_QP)           |
477                 (1ull << IB_USER_VERBS_CMD_QUERY_QP)            |
478                 (1ull << IB_USER_VERBS_CMD_DESTROY_QP)          |
479                 (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST)        |
480                 (1ull << IB_USER_VERBS_CMD_DETACH_MCAST);
481
482         shca->ib_device.node_type           = RDMA_NODE_IB_CA;
483         shca->ib_device.phys_port_cnt       = shca->num_ports;
484         shca->ib_device.num_comp_vectors    = 1;
485         shca->ib_device.dma_device          = &shca->ofdev->dev;
486         shca->ib_device.query_device        = ehca_query_device;
487         shca->ib_device.query_port          = ehca_query_port;
488         shca->ib_device.query_gid           = ehca_query_gid;
489         shca->ib_device.query_pkey          = ehca_query_pkey;
490         /* shca->in_device.modify_device    = ehca_modify_device    */
491         shca->ib_device.modify_port         = ehca_modify_port;
492         shca->ib_device.alloc_ucontext      = ehca_alloc_ucontext;
493         shca->ib_device.dealloc_ucontext    = ehca_dealloc_ucontext;
494         shca->ib_device.alloc_pd            = ehca_alloc_pd;
495         shca->ib_device.dealloc_pd          = ehca_dealloc_pd;
496         shca->ib_device.create_ah           = ehca_create_ah;
497         /* shca->ib_device.modify_ah        = ehca_modify_ah;       */
498         shca->ib_device.query_ah            = ehca_query_ah;
499         shca->ib_device.destroy_ah          = ehca_destroy_ah;
500         shca->ib_device.create_qp           = ehca_create_qp;
501         shca->ib_device.modify_qp           = ehca_modify_qp;
502         shca->ib_device.query_qp            = ehca_query_qp;
503         shca->ib_device.destroy_qp          = ehca_destroy_qp;
504         shca->ib_device.post_send           = ehca_post_send;
505         shca->ib_device.post_recv           = ehca_post_recv;
506         shca->ib_device.create_cq           = ehca_create_cq;
507         shca->ib_device.destroy_cq          = ehca_destroy_cq;
508         shca->ib_device.resize_cq           = ehca_resize_cq;
509         shca->ib_device.poll_cq             = ehca_poll_cq;
510         /* shca->ib_device.peek_cq          = ehca_peek_cq;         */
511         shca->ib_device.req_notify_cq       = ehca_req_notify_cq;
512         /* shca->ib_device.req_ncomp_notif  = ehca_req_ncomp_notif; */
513         shca->ib_device.get_dma_mr          = ehca_get_dma_mr;
514         shca->ib_device.reg_user_mr         = ehca_reg_user_mr;
515         shca->ib_device.dereg_mr            = ehca_dereg_mr;
516         shca->ib_device.alloc_mw            = ehca_alloc_mw;
517         shca->ib_device.dealloc_mw          = ehca_dealloc_mw;
518         shca->ib_device.alloc_fmr           = ehca_alloc_fmr;
519         shca->ib_device.map_phys_fmr        = ehca_map_phys_fmr;
520         shca->ib_device.unmap_fmr           = ehca_unmap_fmr;
521         shca->ib_device.dealloc_fmr         = ehca_dealloc_fmr;
522         shca->ib_device.attach_mcast        = ehca_attach_mcast;
523         shca->ib_device.detach_mcast        = ehca_detach_mcast;
524         shca->ib_device.process_mad         = ehca_process_mad;
525         shca->ib_device.mmap                = ehca_mmap;
526         shca->ib_device.dma_ops             = &ehca_dma_mapping_ops;
527         shca->ib_device.get_port_immutable  = ehca_port_immutable;
528
529         if (EHCA_BMASK_GET(HCA_CAP_SRQ, shca->hca_cap)) {
530                 shca->ib_device.uverbs_cmd_mask |=
531                         (1ull << IB_USER_VERBS_CMD_CREATE_SRQ) |
532                         (1ull << IB_USER_VERBS_CMD_MODIFY_SRQ) |
533                         (1ull << IB_USER_VERBS_CMD_QUERY_SRQ) |
534                         (1ull << IB_USER_VERBS_CMD_DESTROY_SRQ);
535
536                 shca->ib_device.create_srq          = ehca_create_srq;
537                 shca->ib_device.modify_srq          = ehca_modify_srq;
538                 shca->ib_device.query_srq           = ehca_query_srq;
539                 shca->ib_device.destroy_srq         = ehca_destroy_srq;
540                 shca->ib_device.post_srq_recv       = ehca_post_srq_recv;
541         }
542
543         return ret;
544 }
545
546 static int ehca_create_aqp1(struct ehca_shca *shca, u32 port)
547 {
548         struct ehca_sport *sport = &shca->sport[port - 1];
549         struct ib_cq *ibcq;
550         struct ib_qp *ibqp;
551         struct ib_qp_init_attr qp_init_attr;
552         struct ib_cq_init_attr cq_attr = {};
553         int ret;
554
555         if (sport->ibcq_aqp1) {
556                 ehca_err(&shca->ib_device, "AQP1 CQ is already created.");
557                 return -EPERM;
558         }
559
560         cq_attr.cqe = 10;
561         ibcq = ib_create_cq(&shca->ib_device, NULL, NULL, (void *)(-1),
562                             &cq_attr);
563         if (IS_ERR(ibcq)) {
564                 ehca_err(&shca->ib_device, "Cannot create AQP1 CQ.");
565                 return PTR_ERR(ibcq);
566         }
567         sport->ibcq_aqp1 = ibcq;
568
569         if (sport->ibqp_sqp[IB_QPT_GSI]) {
570                 ehca_err(&shca->ib_device, "AQP1 QP is already created.");
571                 ret = -EPERM;
572                 goto create_aqp1;
573         }
574
575         memset(&qp_init_attr, 0, sizeof(struct ib_qp_init_attr));
576         qp_init_attr.send_cq          = ibcq;
577         qp_init_attr.recv_cq          = ibcq;
578         qp_init_attr.sq_sig_type      = IB_SIGNAL_ALL_WR;
579         qp_init_attr.cap.max_send_wr  = 100;
580         qp_init_attr.cap.max_recv_wr  = 100;
581         qp_init_attr.cap.max_send_sge = 2;
582         qp_init_attr.cap.max_recv_sge = 1;
583         qp_init_attr.qp_type          = IB_QPT_GSI;
584         qp_init_attr.port_num         = port;
585         qp_init_attr.qp_context       = NULL;
586         qp_init_attr.event_handler    = NULL;
587         qp_init_attr.srq              = NULL;
588
589         ibqp = ib_create_qp(&shca->pd->ib_pd, &qp_init_attr);
590         if (IS_ERR(ibqp)) {
591                 ehca_err(&shca->ib_device, "Cannot create AQP1 QP.");
592                 ret = PTR_ERR(ibqp);
593                 goto create_aqp1;
594         }
595         sport->ibqp_sqp[IB_QPT_GSI] = ibqp;
596
597         return 0;
598
599 create_aqp1:
600         ib_destroy_cq(sport->ibcq_aqp1);
601         return ret;
602 }
603
604 static int ehca_destroy_aqp1(struct ehca_sport *sport)
605 {
606         int ret;
607
608         ret = ib_destroy_qp(sport->ibqp_sqp[IB_QPT_GSI]);
609         if (ret) {
610                 ehca_gen_err("Cannot destroy AQP1 QP. ret=%i", ret);
611                 return ret;
612         }
613
614         ret = ib_destroy_cq(sport->ibcq_aqp1);
615         if (ret)
616                 ehca_gen_err("Cannot destroy AQP1 CQ. ret=%i", ret);
617
618         return ret;
619 }
620
621 static ssize_t ehca_show_debug_level(struct device_driver *ddp, char *buf)
622 {
623         return snprintf(buf, PAGE_SIZE, "%d\n", ehca_debug_level);
624 }
625
626 static ssize_t ehca_store_debug_level(struct device_driver *ddp,
627                                       const char *buf, size_t count)
628 {
629         int value = (*buf) - '0';
630         if (value >= 0 && value <= 9)
631                 ehca_debug_level = value;
632         return 1;
633 }
634
/*
 * Driver-level sysfs attribute "debug_level", readable and writable by
 * the owner only, served by the show/store handlers above.
 */
static DRIVER_ATTR(debug_level, S_IRUSR | S_IWUSR,
                   ehca_show_debug_level, ehca_store_debug_level);

/* NULL-terminated list of the driver attributes. */
static struct attribute *ehca_drv_attrs[] = {
        &driver_attr_debug_level.attr,
        NULL
};

static struct attribute_group ehca_drv_attr_grp = {
        .attrs = ehca_drv_attrs
};

/* NULL-terminated list of the driver's attribute groups. */
static const struct attribute_group *ehca_drv_attr_groups[] = {
        &ehca_drv_attr_grp,
        NULL,
};
651
/*
 * EHCA_RESOURCE_ATTR(name) - define a read-only device attribute "name".
 *
 * Expands to a show handler ehca_show_<name>() plus the matching
 * dev_attr_<name>.  Each read allocates a firmware control block, queries
 * the HCA with hipz_h_query_hca() and prints rblock-><name> as a decimal
 * integer.  When the allocation or the query fails, an error is logged
 * and 0 is returned, i.e. the read yields no data.
 *
 * Special case: "num_ports" reports 1 when the nr_ports module parameter
 * is 1, whatever the firmware says.
 *
 * NOTE(review): the value is funnelled through an int; if any of the
 * queried fields is wider than int it is truncated here -- confirm
 * against the definition of struct hipz_query_hca.
 */
#define EHCA_RESOURCE_ATTR(name)                                           \
static ssize_t  ehca_show_##name(struct device *dev,                       \
                                 struct device_attribute *attr,            \
                                 char *buf)                                \
{                                                                          \
        struct ehca_shca *shca;                                            \
        struct hipz_query_hca *rblock;                                     \
        int data;                                                          \
                                                                           \
        shca = dev_get_drvdata(dev);                                       \
                                                                           \
        rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);                      \
        if (!rblock) {                                                     \
                dev_err(dev, "Can't allocate rblock memory.\n");           \
                return 0;                                                  \
        }                                                                  \
                                                                           \
        if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) { \
                dev_err(dev, "Can't query device properties\n");           \
                ehca_free_fw_ctrlblock(rblock);                            \
                return 0;                                                  \
        }                                                                  \
                                                                           \
        data = rblock->name;                                               \
        ehca_free_fw_ctrlblock(rblock);                                    \
                                                                           \
        if ((strcmp(#name, "num_ports") == 0) && (ehca_nr_ports == 1))     \
                return snprintf(buf, 256, "1\n");                          \
        else                                                               \
                return snprintf(buf, 256, "%d\n", data);                   \
                                                                           \
}                                                                          \
static DEVICE_ATTR(name, S_IRUGO, ehca_show_##name, NULL);

/* One attribute per queried field of struct hipz_query_hca. */
EHCA_RESOURCE_ATTR(num_ports);
EHCA_RESOURCE_ATTR(hw_ver);
EHCA_RESOURCE_ATTR(max_eq);
EHCA_RESOURCE_ATTR(cur_eq);
EHCA_RESOURCE_ATTR(max_cq);
EHCA_RESOURCE_ATTR(cur_cq);
EHCA_RESOURCE_ATTR(max_qp);
EHCA_RESOURCE_ATTR(cur_qp);
EHCA_RESOURCE_ATTR(max_mr);
EHCA_RESOURCE_ATTR(cur_mr);
EHCA_RESOURCE_ATTR(max_mw);
EHCA_RESOURCE_ATTR(cur_mw);
EHCA_RESOURCE_ATTR(max_pd);
EHCA_RESOURCE_ATTR(max_ah);
700
701 static ssize_t ehca_show_adapter_handle(struct device *dev,
702                                         struct device_attribute *attr,
703                                         char *buf)
704 {
705         struct ehca_shca *shca = dev_get_drvdata(dev);
706
707         return sprintf(buf, "%llx\n", shca->ipz_hca_handle.handle);
708
709 }
710 static DEVICE_ATTR(adapter_handle, S_IRUGO, ehca_show_adapter_handle, NULL);
711
/*
 * NULL-terminated list of all per-device sysfs attributes: the adapter
 * handle plus the attributes generated with EHCA_RESOURCE_ATTR().
 */
static struct attribute *ehca_dev_attrs[] = {
        &dev_attr_adapter_handle.attr,
        &dev_attr_num_ports.attr,
        &dev_attr_hw_ver.attr,
        &dev_attr_max_eq.attr,
        &dev_attr_cur_eq.attr,
        &dev_attr_max_cq.attr,
        &dev_attr_cur_cq.attr,
        &dev_attr_max_qp.attr,
        &dev_attr_cur_qp.attr,
        &dev_attr_max_mr.attr,
        &dev_attr_cur_mr.attr,
        &dev_attr_max_mw.attr,
        &dev_attr_cur_mw.attr,
        &dev_attr_max_pd.attr,
        &dev_attr_max_ah.attr,
        NULL
};

/* Attribute group wrapping ehca_dev_attrs. */
static struct attribute_group ehca_dev_attr_grp = {
        .attrs = ehca_dev_attrs
};
734
735 static int ehca_probe(struct platform_device *dev)
736 {
737         struct ehca_shca *shca;
738         const u64 *handle;
739         struct ib_pd *ibpd;
740         int ret, i, eq_size;
741         unsigned long flags;
742
743         handle = of_get_property(dev->dev.of_node, "ibm,hca-handle", NULL);
744         if (!handle) {
745                 ehca_gen_err("Cannot get eHCA handle for adapter: %s.",
746                              dev->dev.of_node->full_name);
747                 return -ENODEV;
748         }
749
750         if (!(*handle)) {
751                 ehca_gen_err("Wrong eHCA handle for adapter: %s.",
752                              dev->dev.of_node->full_name);
753                 return -ENODEV;
754         }
755
756         shca = (struct ehca_shca *)ib_alloc_device(sizeof(*shca));
757         if (!shca) {
758                 ehca_gen_err("Cannot allocate shca memory.");
759                 return -ENOMEM;
760         }
761
762         mutex_init(&shca->modify_mutex);
763         atomic_set(&shca->num_cqs, 0);
764         atomic_set(&shca->num_qps, 0);
765         shca->max_num_qps = ehca_max_qp;
766         shca->max_num_cqs = ehca_max_cq;
767
768         for (i = 0; i < ARRAY_SIZE(shca->sport); i++)
769                 spin_lock_init(&shca->sport[i].mod_sqp_lock);
770
771         shca->ofdev = dev;
772         shca->ipz_hca_handle.handle = *handle;
773         dev_set_drvdata(&dev->dev, shca);
774
775         ret = ehca_sense_attributes(shca);
776         if (ret < 0) {
777                 ehca_gen_err("Cannot sense eHCA attributes.");
778                 goto probe1;
779         }
780
781         ret = ehca_init_device(shca);
782         if (ret) {
783                 ehca_gen_err("Cannot init ehca  device struct");
784                 goto probe1;
785         }
786
787         eq_size = 2 * shca->max_num_cqs + 4 * shca->max_num_qps;
788         /* create event queues */
789         ret = ehca_create_eq(shca, &shca->eq, EHCA_EQ, eq_size);
790         if (ret) {
791                 ehca_err(&shca->ib_device, "Cannot create EQ.");
792                 goto probe1;
793         }
794
795         ret = ehca_create_eq(shca, &shca->neq, EHCA_NEQ, 513);
796         if (ret) {
797                 ehca_err(&shca->ib_device, "Cannot create NEQ.");
798                 goto probe3;
799         }
800
801         /* create internal protection domain */
802         ibpd = ehca_alloc_pd(&shca->ib_device, (void *)(-1), NULL);
803         if (IS_ERR(ibpd)) {
804                 ehca_err(&shca->ib_device, "Cannot create internal PD.");
805                 ret = PTR_ERR(ibpd);
806                 goto probe4;
807         }
808
809         shca->pd = container_of(ibpd, struct ehca_pd, ib_pd);
810         shca->pd->ib_pd.device = &shca->ib_device;
811
812         /* create internal max MR */
813         ret = ehca_reg_internal_maxmr(shca, shca->pd, &shca->maxmr);
814
815         if (ret) {
816                 ehca_err(&shca->ib_device, "Cannot create internal MR ret=%i",
817                          ret);
818                 goto probe5;
819         }
820
821         ret = ib_register_device(&shca->ib_device, NULL);
822         if (ret) {
823                 ehca_err(&shca->ib_device,
824                          "ib_register_device() failed ret=%i", ret);
825                 goto probe6;
826         }
827
828         /* create AQP1 for port 1 */
829         if (ehca_open_aqp1 == 1) {
830                 shca->sport[0].port_state = IB_PORT_DOWN;
831                 ret = ehca_create_aqp1(shca, 1);
832                 if (ret) {
833                         ehca_err(&shca->ib_device,
834                                  "Cannot create AQP1 for port 1.");
835                         goto probe7;
836                 }
837         }
838
839         /* create AQP1 for port 2 */
840         if ((ehca_open_aqp1 == 1) && (shca->num_ports == 2)) {
841                 shca->sport[1].port_state = IB_PORT_DOWN;
842                 ret = ehca_create_aqp1(shca, 2);
843                 if (ret) {
844                         ehca_err(&shca->ib_device,
845                                  "Cannot create AQP1 for port 2.");
846                         goto probe8;
847                 }
848         }
849
850         ret = sysfs_create_group(&dev->dev.kobj, &ehca_dev_attr_grp);
851         if (ret) /* only complain; we can live without attributes */
852                 ehca_err(&shca->ib_device,
853                          "Cannot create device attributes  ret=%d", ret);
854
855         spin_lock_irqsave(&shca_list_lock, flags);
856         list_add(&shca->shca_list, &shca_list);
857         spin_unlock_irqrestore(&shca_list_lock, flags);
858
859         return 0;
860
861 probe8:
862         ret = ehca_destroy_aqp1(&shca->sport[0]);
863         if (ret)
864                 ehca_err(&shca->ib_device,
865                          "Cannot destroy AQP1 for port 1. ret=%i", ret);
866
867 probe7:
868         ib_unregister_device(&shca->ib_device);
869
870 probe6:
871         ret = ehca_dereg_internal_maxmr(shca);
872         if (ret)
873                 ehca_err(&shca->ib_device,
874                          "Cannot destroy internal MR. ret=%x", ret);
875
876 probe5:
877         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
878         if (ret)
879                 ehca_err(&shca->ib_device,
880                          "Cannot destroy internal PD. ret=%x", ret);
881
882 probe4:
883         ret = ehca_destroy_eq(shca, &shca->neq);
884         if (ret)
885                 ehca_err(&shca->ib_device,
886                          "Cannot destroy NEQ. ret=%x", ret);
887
888 probe3:
889         ret = ehca_destroy_eq(shca, &shca->eq);
890         if (ret)
891                 ehca_err(&shca->ib_device,
892                          "Cannot destroy EQ. ret=%x", ret);
893
894 probe1:
895         ib_dealloc_device(&shca->ib_device);
896
897         return -EINVAL;
898 }
899
900 static int ehca_remove(struct platform_device *dev)
901 {
902         struct ehca_shca *shca = dev_get_drvdata(&dev->dev);
903         unsigned long flags;
904         int ret;
905
906         sysfs_remove_group(&dev->dev.kobj, &ehca_dev_attr_grp);
907
908         if (ehca_open_aqp1 == 1) {
909                 int i;
910                 for (i = 0; i < shca->num_ports; i++) {
911                         ret = ehca_destroy_aqp1(&shca->sport[i]);
912                         if (ret)
913                                 ehca_err(&shca->ib_device,
914                                          "Cannot destroy AQP1 for port %x "
915                                          "ret=%i", ret, i);
916                 }
917         }
918
919         ib_unregister_device(&shca->ib_device);
920
921         ret = ehca_dereg_internal_maxmr(shca);
922         if (ret)
923                 ehca_err(&shca->ib_device,
924                          "Cannot destroy internal MR. ret=%i", ret);
925
926         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
927         if (ret)
928                 ehca_err(&shca->ib_device,
929                          "Cannot destroy internal PD. ret=%i", ret);
930
931         ret = ehca_destroy_eq(shca, &shca->eq);
932         if (ret)
933                 ehca_err(&shca->ib_device, "Cannot destroy EQ. ret=%i", ret);
934
935         ret = ehca_destroy_eq(shca, &shca->neq);
936         if (ret)
937                 ehca_err(&shca->ib_device, "Canot destroy NEQ. ret=%i", ret);
938
939         ib_dealloc_device(&shca->ib_device);
940
941         spin_lock_irqsave(&shca_list_lock, flags);
942         list_del(&shca->shca_list);
943         spin_unlock_irqrestore(&shca_list_lock, flags);
944
945         return ret;
946 }
947
948 static struct of_device_id ehca_device_table[] =
949 {
950         {
951                 .name       = "lhca",
952                 .compatible = "IBM,lhca",
953         },
954         {},
955 };
956 MODULE_DEVICE_TABLE(of, ehca_device_table);
957
958 static struct platform_driver ehca_driver = {
959         .probe       = ehca_probe,
960         .remove      = ehca_remove,
961         .driver = {
962                 .name = "ehca",
963                 .owner = THIS_MODULE,
964                 .groups = ehca_drv_attr_groups,
965                 .of_match_table = ehca_device_table,
966         },
967 };
968
969 void ehca_poll_eqs(unsigned long data)
970 {
971         struct ehca_shca *shca;
972
973         spin_lock(&shca_list_lock);
974         list_for_each_entry(shca, &shca_list, shca_list) {
975                 if (shca->eq.is_initialized) {
976                         /* call deadman proc only if eq ptr does not change */
977                         struct ehca_eq *eq = &shca->eq;
978                         int max = 3;
979                         volatile u64 q_ofs, q_ofs2;
980                         unsigned long flags;
981                         spin_lock_irqsave(&eq->spinlock, flags);
982                         q_ofs = eq->ipz_queue.current_q_offset;
983                         spin_unlock_irqrestore(&eq->spinlock, flags);
984                         do {
985                                 spin_lock_irqsave(&eq->spinlock, flags);
986                                 q_ofs2 = eq->ipz_queue.current_q_offset;
987                                 spin_unlock_irqrestore(&eq->spinlock, flags);
988                                 max--;
989                         } while (q_ofs == q_ofs2 && max > 0);
990                         if (q_ofs == q_ofs2)
991                                 ehca_process_eq(shca, 0);
992                 }
993         }
994         mod_timer(&poll_eqs_timer, round_jiffies(jiffies + HZ));
995         spin_unlock(&shca_list_lock);
996 }
997
998 static int ehca_mem_notifier(struct notifier_block *nb,
999                              unsigned long action, void *data)
1000 {
1001         static unsigned long ehca_dmem_warn_time;
1002         unsigned long flags;
1003
1004         switch (action) {
1005         case MEM_CANCEL_OFFLINE:
1006         case MEM_CANCEL_ONLINE:
1007         case MEM_ONLINE:
1008         case MEM_OFFLINE:
1009                 return NOTIFY_OK;
1010         case MEM_GOING_ONLINE:
1011         case MEM_GOING_OFFLINE:
1012                 /* only ok if no hca is attached to the lpar */
1013                 spin_lock_irqsave(&shca_list_lock, flags);
1014                 if (list_empty(&shca_list)) {
1015                         spin_unlock_irqrestore(&shca_list_lock, flags);
1016                         return NOTIFY_OK;
1017                 } else {
1018                         spin_unlock_irqrestore(&shca_list_lock, flags);
1019                         if (printk_timed_ratelimit(&ehca_dmem_warn_time,
1020                                                    30 * 1000))
1021                                 ehca_gen_err("DMEM operations are not allowed"
1022                                              "in conjunction with eHCA");
1023                         return NOTIFY_BAD;
1024                 }
1025         }
1026         return NOTIFY_OK;
1027 }
1028
1029 static struct notifier_block ehca_mem_nb = {
1030         .notifier_call = ehca_mem_notifier,
1031 };
1032
1033 static int __init ehca_module_init(void)
1034 {
1035         int ret;
1036
1037         printk(KERN_INFO "eHCA Infiniband Device Driver "
1038                "(Version " HCAD_VERSION ")\n");
1039
1040         ret = ehca_create_comp_pool();
1041         if (ret) {
1042                 ehca_gen_err("Cannot create comp pool.");
1043                 return ret;
1044         }
1045
1046         ret = ehca_create_slab_caches();
1047         if (ret) {
1048                 ehca_gen_err("Cannot create SLAB caches");
1049                 ret = -ENOMEM;
1050                 goto module_init1;
1051         }
1052
1053         ret = ehca_create_busmap();
1054         if (ret) {
1055                 ehca_gen_err("Cannot create busmap.");
1056                 goto module_init2;
1057         }
1058
1059         ret = ibmebus_register_driver(&ehca_driver);
1060         if (ret) {
1061                 ehca_gen_err("Cannot register eHCA device driver");
1062                 ret = -EINVAL;
1063                 goto module_init3;
1064         }
1065
1066         ret = register_memory_notifier(&ehca_mem_nb);
1067         if (ret) {
1068                 ehca_gen_err("Failed registering memory add/remove notifier");
1069                 goto module_init4;
1070         }
1071
1072         if (ehca_poll_all_eqs != 1) {
1073                 ehca_gen_err("WARNING!!!");
1074                 ehca_gen_err("It is possible to lose interrupts.");
1075         } else {
1076                 init_timer(&poll_eqs_timer);
1077                 poll_eqs_timer.function = ehca_poll_eqs;
1078                 poll_eqs_timer.expires = jiffies + HZ;
1079                 add_timer(&poll_eqs_timer);
1080         }
1081
1082         return 0;
1083
1084 module_init4:
1085         ibmebus_unregister_driver(&ehca_driver);
1086
1087 module_init3:
1088         ehca_destroy_busmap();
1089
1090 module_init2:
1091         ehca_destroy_slab_caches();
1092
1093 module_init1:
1094         ehca_destroy_comp_pool();
1095         return ret;
1096 };
1097
1098 static void __exit ehca_module_exit(void)
1099 {
1100         if (ehca_poll_all_eqs == 1)
1101                 del_timer_sync(&poll_eqs_timer);
1102
1103         ibmebus_unregister_driver(&ehca_driver);
1104
1105         unregister_memory_notifier(&ehca_mem_nb);
1106
1107         ehca_destroy_busmap();
1108
1109         ehca_destroy_slab_caches();
1110
1111         ehca_destroy_comp_pool();
1112
1113         idr_destroy(&ehca_cq_idr);
1114         idr_destroy(&ehca_qp_idr);
1115 };
1116
1117 module_init(ehca_module_init);
1118 module_exit(ehca_module_exit);