Merge branches 'mlx5', 'qib' and 'srp' into for-next
[linux-2.6-block.git] / drivers / infiniband / hw / ehca / ehca_main.c
1 /*
2  *  IBM eServer eHCA Infiniband device driver for Linux on POWER
3  *
4  *  module start stop, hca detection
5  *
6  *  Authors: Heiko J Schick <schickhj@de.ibm.com>
7  *           Hoang-Nam Nguyen <hnguyen@de.ibm.com>
8  *           Joachim Fenkes <fenkes@de.ibm.com>
9  *
10  *  Copyright (c) 2005 IBM Corporation
11  *
12  *  All rights reserved.
13  *
14  *  This source code is distributed under a dual license of GPL v2.0 and OpenIB
15  *  BSD.
16  *
17  * OpenIB BSD License
18  *
19  * Redistribution and use in source and binary forms, with or without
20  * modification, are permitted provided that the following conditions are met:
21  *
22  * Redistributions of source code must retain the above copyright notice, this
23  * list of conditions and the following disclaimer.
24  *
25  * Redistributions in binary form must reproduce the above copyright notice,
26  * this list of conditions and the following disclaimer in the documentation
27  * and/or other materials
28  * provided with the distribution.
29  *
30  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
31  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
32  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
33  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
34  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
35  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
36  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
37  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
38  * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
39  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
40  * POSSIBILITY OF SUCH DAMAGE.
41  */
42
43 #ifdef CONFIG_PPC_64K_PAGES
44 #include <linux/slab.h>
45 #endif
46
47 #include <linux/notifier.h>
48 #include <linux/memory.h>
49 #include "ehca_classes.h"
50 #include "ehca_iverbs.h"
51 #include "ehca_mrmw.h"
52 #include "ehca_tools.h"
53 #include "hcp_if.h"
54
55 #define HCAD_VERSION "0029"
56
57 MODULE_LICENSE("Dual BSD/GPL");
58 MODULE_AUTHOR("Christoph Raisch <raisch@de.ibm.com>");
59 MODULE_DESCRIPTION("IBM eServer HCA InfiniBand Device Driver");
60 MODULE_VERSION(HCAD_VERSION);
61
62 static bool ehca_open_aqp1    = 0;
63 static int ehca_hw_level      = 0;
64 static bool ehca_poll_all_eqs = 1;
65
66 int ehca_debug_level   = 0;
67 int ehca_nr_ports      = -1;
68 bool ehca_use_hp_mr    = 0;
69 int ehca_port_act_time = 30;
70 int ehca_static_rate   = -1;
71 bool ehca_scaling_code = 0;
72 int ehca_lock_hcalls   = -1;
73 int ehca_max_cq        = -1;
74 int ehca_max_qp        = -1;
75
76 module_param_named(open_aqp1,     ehca_open_aqp1,     bool, S_IRUGO);
77 module_param_named(debug_level,   ehca_debug_level,   int,  S_IRUGO);
78 module_param_named(hw_level,      ehca_hw_level,      int,  S_IRUGO);
79 module_param_named(nr_ports,      ehca_nr_ports,      int,  S_IRUGO);
80 module_param_named(use_hp_mr,     ehca_use_hp_mr,     bool, S_IRUGO);
81 module_param_named(port_act_time, ehca_port_act_time, int,  S_IRUGO);
82 module_param_named(poll_all_eqs,  ehca_poll_all_eqs,  bool, S_IRUGO);
83 module_param_named(static_rate,   ehca_static_rate,   int,  S_IRUGO);
84 module_param_named(scaling_code,  ehca_scaling_code,  bool, S_IRUGO);
85 module_param_named(lock_hcalls,   ehca_lock_hcalls,   bint, S_IRUGO);
86 module_param_named(number_of_cqs, ehca_max_cq,        int,  S_IRUGO);
87 module_param_named(number_of_qps, ehca_max_qp,        int,  S_IRUGO);
88
89 MODULE_PARM_DESC(open_aqp1,
90                  "Open AQP1 on startup (default: no)");
91 MODULE_PARM_DESC(debug_level,
92                  "Amount of debug output (0: none (default), 1: traces, "
93                  "2: some dumps, 3: lots)");
94 MODULE_PARM_DESC(hw_level,
95                  "Hardware level (0: autosensing (default), "
96                  "0x10..0x14: eHCA, 0x20..0x23: eHCA2)");
97 MODULE_PARM_DESC(nr_ports,
98                  "number of connected ports (-1: autodetect (default), "
99                  "1: port one only, 2: two ports)");
100 MODULE_PARM_DESC(use_hp_mr,
101                  "Use high performance MRs (default: no)");
102 MODULE_PARM_DESC(port_act_time,
103                  "Time to wait for port activation (default: 30 sec)");
104 MODULE_PARM_DESC(poll_all_eqs,
105                  "Poll all event queues periodically (default: yes)");
106 MODULE_PARM_DESC(static_rate,
107                  "Set permanent static rate (default: no static rate)");
108 MODULE_PARM_DESC(scaling_code,
109                  "Enable scaling code (default: no)");
110 MODULE_PARM_DESC(lock_hcalls,
111                  "Serialize all hCalls made by the driver "
112                  "(default: autodetect)");
113 MODULE_PARM_DESC(number_of_cqs,
114                 "Max number of CQs which can be allocated "
115                 "(default: autodetect)");
116 MODULE_PARM_DESC(number_of_qps,
117                 "Max number of QPs which can be allocated "
118                 "(default: autodetect)");
119
120 DEFINE_RWLOCK(ehca_qp_idr_lock);
121 DEFINE_RWLOCK(ehca_cq_idr_lock);
122 DEFINE_IDR(ehca_qp_idr);
123 DEFINE_IDR(ehca_cq_idr);
124
125 static LIST_HEAD(shca_list); /* list of all registered ehcas */
126 DEFINE_SPINLOCK(shca_list_lock);
127
128 static struct timer_list poll_eqs_timer;
129
130 #ifdef CONFIG_PPC_64K_PAGES
131 static struct kmem_cache *ctblk_cache;
132
133 void *ehca_alloc_fw_ctrlblock(gfp_t flags)
134 {
135         void *ret = kmem_cache_zalloc(ctblk_cache, flags);
136         if (!ret)
137                 ehca_gen_err("Out of memory for ctblk");
138         return ret;
139 }
140
141 void ehca_free_fw_ctrlblock(void *ptr)
142 {
143         if (ptr)
144                 kmem_cache_free(ctblk_cache, ptr);
145
146 }
147 #endif
148
149 int ehca2ib_return_code(u64 ehca_rc)
150 {
151         switch (ehca_rc) {
152         case H_SUCCESS:
153                 return 0;
154         case H_RESOURCE:             /* Resource in use */
155         case H_BUSY:
156                 return -EBUSY;
157         case H_NOT_ENOUGH_RESOURCES: /* insufficient resources */
158         case H_CONSTRAINED:          /* resource constraint */
159         case H_NO_MEM:
160                 return -ENOMEM;
161         default:
162                 return -EINVAL;
163         }
164 }
165
166 static int ehca_create_slab_caches(void)
167 {
168         int ret;
169
170         ret = ehca_init_pd_cache();
171         if (ret) {
172                 ehca_gen_err("Cannot create PD SLAB cache.");
173                 return ret;
174         }
175
176         ret = ehca_init_cq_cache();
177         if (ret) {
178                 ehca_gen_err("Cannot create CQ SLAB cache.");
179                 goto create_slab_caches2;
180         }
181
182         ret = ehca_init_qp_cache();
183         if (ret) {
184                 ehca_gen_err("Cannot create QP SLAB cache.");
185                 goto create_slab_caches3;
186         }
187
188         ret = ehca_init_av_cache();
189         if (ret) {
190                 ehca_gen_err("Cannot create AV SLAB cache.");
191                 goto create_slab_caches4;
192         }
193
194         ret = ehca_init_mrmw_cache();
195         if (ret) {
196                 ehca_gen_err("Cannot create MR&MW SLAB cache.");
197                 goto create_slab_caches5;
198         }
199
200         ret = ehca_init_small_qp_cache();
201         if (ret) {
202                 ehca_gen_err("Cannot create small queue SLAB cache.");
203                 goto create_slab_caches6;
204         }
205
206 #ifdef CONFIG_PPC_64K_PAGES
207         ctblk_cache = kmem_cache_create("ehca_cache_ctblk",
208                                         EHCA_PAGESIZE, H_CB_ALIGNMENT,
209                                         SLAB_HWCACHE_ALIGN,
210                                         NULL);
211         if (!ctblk_cache) {
212                 ehca_gen_err("Cannot create ctblk SLAB cache.");
213                 ehca_cleanup_small_qp_cache();
214                 ret = -ENOMEM;
215                 goto create_slab_caches6;
216         }
217 #endif
218         return 0;
219
220 create_slab_caches6:
221         ehca_cleanup_mrmw_cache();
222
223 create_slab_caches5:
224         ehca_cleanup_av_cache();
225
226 create_slab_caches4:
227         ehca_cleanup_qp_cache();
228
229 create_slab_caches3:
230         ehca_cleanup_cq_cache();
231
232 create_slab_caches2:
233         ehca_cleanup_pd_cache();
234
235         return ret;
236 }
237
238 static void ehca_destroy_slab_caches(void)
239 {
240         ehca_cleanup_small_qp_cache();
241         ehca_cleanup_mrmw_cache();
242         ehca_cleanup_av_cache();
243         ehca_cleanup_qp_cache();
244         ehca_cleanup_cq_cache();
245         ehca_cleanup_pd_cache();
246 #ifdef CONFIG_PPC_64K_PAGES
247         if (ctblk_cache)
248                 kmem_cache_destroy(ctblk_cache);
249 #endif
250 }
251
252 #define EHCA_HCAAVER  EHCA_BMASK_IBM(32, 39)
253 #define EHCA_REVID    EHCA_BMASK_IBM(40, 63)
254
255 static struct cap_descr {
256         u64 mask;
257         char *descr;
258 } hca_cap_descr[] = {
259         { HCA_CAP_AH_PORT_NR_CHECK, "HCA_CAP_AH_PORT_NR_CHECK" },
260         { HCA_CAP_ATOMIC, "HCA_CAP_ATOMIC" },
261         { HCA_CAP_AUTO_PATH_MIG, "HCA_CAP_AUTO_PATH_MIG" },
262         { HCA_CAP_BAD_P_KEY_CTR, "HCA_CAP_BAD_P_KEY_CTR" },
263         { HCA_CAP_SQD_RTS_PORT_CHANGE, "HCA_CAP_SQD_RTS_PORT_CHANGE" },
264         { HCA_CAP_CUR_QP_STATE_MOD, "HCA_CAP_CUR_QP_STATE_MOD" },
265         { HCA_CAP_INIT_TYPE, "HCA_CAP_INIT_TYPE" },
266         { HCA_CAP_PORT_ACTIVE_EVENT, "HCA_CAP_PORT_ACTIVE_EVENT" },
267         { HCA_CAP_Q_KEY_VIOL_CTR, "HCA_CAP_Q_KEY_VIOL_CTR" },
268         { HCA_CAP_WQE_RESIZE, "HCA_CAP_WQE_RESIZE" },
269         { HCA_CAP_RAW_PACKET_MCAST, "HCA_CAP_RAW_PACKET_MCAST" },
270         { HCA_CAP_SHUTDOWN_PORT, "HCA_CAP_SHUTDOWN_PORT" },
271         { HCA_CAP_RC_LL_QP, "HCA_CAP_RC_LL_QP" },
272         { HCA_CAP_SRQ, "HCA_CAP_SRQ" },
273         { HCA_CAP_UD_LL_QP, "HCA_CAP_UD_LL_QP" },
274         { HCA_CAP_RESIZE_MR, "HCA_CAP_RESIZE_MR" },
275         { HCA_CAP_MINI_QP, "HCA_CAP_MINI_QP" },
276         { HCA_CAP_H_ALLOC_RES_SYNC, "HCA_CAP_H_ALLOC_RES_SYNC" },
277 };
278
279 static int ehca_sense_attributes(struct ehca_shca *shca)
280 {
281         int i, ret = 0;
282         u64 h_ret;
283         struct hipz_query_hca *rblock;
284         struct hipz_query_port *port;
285         const char *loc_code;
286
287         static const u32 pgsize_map[] = {
288                 HCA_CAP_MR_PGSIZE_4K,  0x1000,
289                 HCA_CAP_MR_PGSIZE_64K, 0x10000,
290                 HCA_CAP_MR_PGSIZE_1M,  0x100000,
291                 HCA_CAP_MR_PGSIZE_16M, 0x1000000,
292         };
293
294         ehca_gen_dbg("Probing adapter %s...",
295                      shca->ofdev->dev.of_node->full_name);
296         loc_code = of_get_property(shca->ofdev->dev.of_node, "ibm,loc-code",
297                                    NULL);
298         if (loc_code)
299                 ehca_gen_dbg(" ... location lode=%s", loc_code);
300
301         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
302         if (!rblock) {
303                 ehca_gen_err("Cannot allocate rblock memory.");
304                 return -ENOMEM;
305         }
306
307         h_ret = hipz_h_query_hca(shca->ipz_hca_handle, rblock);
308         if (h_ret != H_SUCCESS) {
309                 ehca_gen_err("Cannot query device properties. h_ret=%lli",
310                              h_ret);
311                 ret = -EPERM;
312                 goto sense_attributes1;
313         }
314
315         if (ehca_nr_ports == 1)
316                 shca->num_ports = 1;
317         else
318                 shca->num_ports = (u8)rblock->num_ports;
319
320         ehca_gen_dbg(" ... found %x ports", rblock->num_ports);
321
322         if (ehca_hw_level == 0) {
323                 u32 hcaaver;
324                 u32 revid;
325
326                 hcaaver = EHCA_BMASK_GET(EHCA_HCAAVER, rblock->hw_ver);
327                 revid   = EHCA_BMASK_GET(EHCA_REVID, rblock->hw_ver);
328
329                 ehca_gen_dbg(" ... hardware version=%x:%x", hcaaver, revid);
330
331                 if (hcaaver == 1) {
332                         if (revid <= 3)
333                                 shca->hw_level = 0x10 | (revid + 1);
334                         else
335                                 shca->hw_level = 0x14;
336                 } else if (hcaaver == 2) {
337                         if (revid == 0)
338                                 shca->hw_level = 0x21;
339                         else if (revid == 0x10)
340                                 shca->hw_level = 0x22;
341                         else if (revid == 0x20 || revid == 0x21)
342                                 shca->hw_level = 0x23;
343                 }
344
345                 if (!shca->hw_level) {
346                         ehca_gen_warn("unknown hardware version"
347                                       " - assuming default level");
348                         shca->hw_level = 0x22;
349                 }
350         } else
351                 shca->hw_level = ehca_hw_level;
352         ehca_gen_dbg(" ... hardware level=%x", shca->hw_level);
353
354         shca->hca_cap = rblock->hca_cap_indicators;
355         ehca_gen_dbg(" ... HCA capabilities:");
356         for (i = 0; i < ARRAY_SIZE(hca_cap_descr); i++)
357                 if (EHCA_BMASK_GET(hca_cap_descr[i].mask, shca->hca_cap))
358                         ehca_gen_dbg("   %s", hca_cap_descr[i].descr);
359
360         /* Autodetect hCall locking -- the "H_ALLOC_RESOURCE synced" flag is
361          * a firmware property, so it's valid across all adapters
362          */
363         if (ehca_lock_hcalls == -1)
364                 ehca_lock_hcalls = !EHCA_BMASK_GET(HCA_CAP_H_ALLOC_RES_SYNC,
365                                         shca->hca_cap);
366
367         /* translate supported MR page sizes; always support 4K */
368         shca->hca_cap_mr_pgsize = EHCA_PAGESIZE;
369         for (i = 0; i < ARRAY_SIZE(pgsize_map); i += 2)
370                 if (rblock->memory_page_size_supported & pgsize_map[i])
371                         shca->hca_cap_mr_pgsize |= pgsize_map[i + 1];
372
373         /* Set maximum number of CQs and QPs to calculate EQ size */
374         if (shca->max_num_qps == -1)
375                 shca->max_num_qps = min_t(int, rblock->max_qp,
376                                           EHCA_MAX_NUM_QUEUES);
377         else if (shca->max_num_qps < 1 || shca->max_num_qps > rblock->max_qp) {
378                 ehca_gen_warn("The requested number of QPs is out of range "
379                               "(1 - %i) specified by HW. Value is set to %i",
380                               rblock->max_qp, rblock->max_qp);
381                 shca->max_num_qps = rblock->max_qp;
382         }
383
384         if (shca->max_num_cqs == -1)
385                 shca->max_num_cqs = min_t(int, rblock->max_cq,
386                                           EHCA_MAX_NUM_QUEUES);
387         else if (shca->max_num_cqs < 1 || shca->max_num_cqs > rblock->max_cq) {
388                 ehca_gen_warn("The requested number of CQs is out of range "
389                               "(1 - %i) specified by HW. Value is set to %i",
390                               rblock->max_cq, rblock->max_cq);
391         }
392
393         /* query max MTU from first port -- it's the same for all ports */
394         port = (struct hipz_query_port *)rblock;
395         h_ret = hipz_h_query_port(shca->ipz_hca_handle, 1, port);
396         if (h_ret != H_SUCCESS) {
397                 ehca_gen_err("Cannot query port properties. h_ret=%lli",
398                              h_ret);
399                 ret = -EPERM;
400                 goto sense_attributes1;
401         }
402
403         shca->max_mtu = port->max_mtu;
404
405 sense_attributes1:
406         ehca_free_fw_ctrlblock(rblock);
407         return ret;
408 }
409
410 static int init_node_guid(struct ehca_shca *shca)
411 {
412         int ret = 0;
413         struct hipz_query_hca *rblock;
414
415         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
416         if (!rblock) {
417                 ehca_err(&shca->ib_device, "Can't allocate rblock memory.");
418                 return -ENOMEM;
419         }
420
421         if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) {
422                 ehca_err(&shca->ib_device, "Can't query device properties");
423                 ret = -EINVAL;
424                 goto init_node_guid1;
425         }
426
427         memcpy(&shca->ib_device.node_guid, &rblock->node_guid, sizeof(u64));
428
429 init_node_guid1:
430         ehca_free_fw_ctrlblock(rblock);
431         return ret;
432 }
433
434 static int ehca_init_device(struct ehca_shca *shca)
435 {
436         int ret;
437
438         ret = init_node_guid(shca);
439         if (ret)
440                 return ret;
441
442         strlcpy(shca->ib_device.name, "ehca%d", IB_DEVICE_NAME_MAX);
443         shca->ib_device.owner               = THIS_MODULE;
444
445         shca->ib_device.uverbs_abi_ver      = 8;
446         shca->ib_device.uverbs_cmd_mask     =
447                 (1ull << IB_USER_VERBS_CMD_GET_CONTEXT)         |
448                 (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE)        |
449                 (1ull << IB_USER_VERBS_CMD_QUERY_PORT)          |
450                 (1ull << IB_USER_VERBS_CMD_ALLOC_PD)            |
451                 (1ull << IB_USER_VERBS_CMD_DEALLOC_PD)          |
452                 (1ull << IB_USER_VERBS_CMD_REG_MR)              |
453                 (1ull << IB_USER_VERBS_CMD_DEREG_MR)            |
454                 (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
455                 (1ull << IB_USER_VERBS_CMD_CREATE_CQ)           |
456                 (1ull << IB_USER_VERBS_CMD_DESTROY_CQ)          |
457                 (1ull << IB_USER_VERBS_CMD_CREATE_QP)           |
458                 (1ull << IB_USER_VERBS_CMD_MODIFY_QP)           |
459                 (1ull << IB_USER_VERBS_CMD_QUERY_QP)            |
460                 (1ull << IB_USER_VERBS_CMD_DESTROY_QP)          |
461                 (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST)        |
462                 (1ull << IB_USER_VERBS_CMD_DETACH_MCAST);
463
464         shca->ib_device.node_type           = RDMA_NODE_IB_CA;
465         shca->ib_device.phys_port_cnt       = shca->num_ports;
466         shca->ib_device.num_comp_vectors    = 1;
467         shca->ib_device.dma_device          = &shca->ofdev->dev;
468         shca->ib_device.query_device        = ehca_query_device;
469         shca->ib_device.query_port          = ehca_query_port;
470         shca->ib_device.query_gid           = ehca_query_gid;
471         shca->ib_device.query_pkey          = ehca_query_pkey;
472         /* shca->in_device.modify_device    = ehca_modify_device    */
473         shca->ib_device.modify_port         = ehca_modify_port;
474         shca->ib_device.alloc_ucontext      = ehca_alloc_ucontext;
475         shca->ib_device.dealloc_ucontext    = ehca_dealloc_ucontext;
476         shca->ib_device.alloc_pd            = ehca_alloc_pd;
477         shca->ib_device.dealloc_pd          = ehca_dealloc_pd;
478         shca->ib_device.create_ah           = ehca_create_ah;
479         /* shca->ib_device.modify_ah        = ehca_modify_ah;       */
480         shca->ib_device.query_ah            = ehca_query_ah;
481         shca->ib_device.destroy_ah          = ehca_destroy_ah;
482         shca->ib_device.create_qp           = ehca_create_qp;
483         shca->ib_device.modify_qp           = ehca_modify_qp;
484         shca->ib_device.query_qp            = ehca_query_qp;
485         shca->ib_device.destroy_qp          = ehca_destroy_qp;
486         shca->ib_device.post_send           = ehca_post_send;
487         shca->ib_device.post_recv           = ehca_post_recv;
488         shca->ib_device.create_cq           = ehca_create_cq;
489         shca->ib_device.destroy_cq          = ehca_destroy_cq;
490         shca->ib_device.resize_cq           = ehca_resize_cq;
491         shca->ib_device.poll_cq             = ehca_poll_cq;
492         /* shca->ib_device.peek_cq          = ehca_peek_cq;         */
493         shca->ib_device.req_notify_cq       = ehca_req_notify_cq;
494         /* shca->ib_device.req_ncomp_notif  = ehca_req_ncomp_notif; */
495         shca->ib_device.get_dma_mr          = ehca_get_dma_mr;
496         shca->ib_device.reg_phys_mr         = ehca_reg_phys_mr;
497         shca->ib_device.reg_user_mr         = ehca_reg_user_mr;
498         shca->ib_device.query_mr            = ehca_query_mr;
499         shca->ib_device.dereg_mr            = ehca_dereg_mr;
500         shca->ib_device.rereg_phys_mr       = ehca_rereg_phys_mr;
501         shca->ib_device.alloc_mw            = ehca_alloc_mw;
502         shca->ib_device.bind_mw             = ehca_bind_mw;
503         shca->ib_device.dealloc_mw          = ehca_dealloc_mw;
504         shca->ib_device.alloc_fmr           = ehca_alloc_fmr;
505         shca->ib_device.map_phys_fmr        = ehca_map_phys_fmr;
506         shca->ib_device.unmap_fmr           = ehca_unmap_fmr;
507         shca->ib_device.dealloc_fmr         = ehca_dealloc_fmr;
508         shca->ib_device.attach_mcast        = ehca_attach_mcast;
509         shca->ib_device.detach_mcast        = ehca_detach_mcast;
510         shca->ib_device.process_mad         = ehca_process_mad;
511         shca->ib_device.mmap                = ehca_mmap;
512         shca->ib_device.dma_ops             = &ehca_dma_mapping_ops;
513
514         if (EHCA_BMASK_GET(HCA_CAP_SRQ, shca->hca_cap)) {
515                 shca->ib_device.uverbs_cmd_mask |=
516                         (1ull << IB_USER_VERBS_CMD_CREATE_SRQ) |
517                         (1ull << IB_USER_VERBS_CMD_MODIFY_SRQ) |
518                         (1ull << IB_USER_VERBS_CMD_QUERY_SRQ) |
519                         (1ull << IB_USER_VERBS_CMD_DESTROY_SRQ);
520
521                 shca->ib_device.create_srq          = ehca_create_srq;
522                 shca->ib_device.modify_srq          = ehca_modify_srq;
523                 shca->ib_device.query_srq           = ehca_query_srq;
524                 shca->ib_device.destroy_srq         = ehca_destroy_srq;
525                 shca->ib_device.post_srq_recv       = ehca_post_srq_recv;
526         }
527
528         return ret;
529 }
530
531 static int ehca_create_aqp1(struct ehca_shca *shca, u32 port)
532 {
533         struct ehca_sport *sport = &shca->sport[port - 1];
534         struct ib_cq *ibcq;
535         struct ib_qp *ibqp;
536         struct ib_qp_init_attr qp_init_attr;
537         int ret;
538
539         if (sport->ibcq_aqp1) {
540                 ehca_err(&shca->ib_device, "AQP1 CQ is already created.");
541                 return -EPERM;
542         }
543
544         ibcq = ib_create_cq(&shca->ib_device, NULL, NULL, (void *)(-1), 10, 0);
545         if (IS_ERR(ibcq)) {
546                 ehca_err(&shca->ib_device, "Cannot create AQP1 CQ.");
547                 return PTR_ERR(ibcq);
548         }
549         sport->ibcq_aqp1 = ibcq;
550
551         if (sport->ibqp_sqp[IB_QPT_GSI]) {
552                 ehca_err(&shca->ib_device, "AQP1 QP is already created.");
553                 ret = -EPERM;
554                 goto create_aqp1;
555         }
556
557         memset(&qp_init_attr, 0, sizeof(struct ib_qp_init_attr));
558         qp_init_attr.send_cq          = ibcq;
559         qp_init_attr.recv_cq          = ibcq;
560         qp_init_attr.sq_sig_type      = IB_SIGNAL_ALL_WR;
561         qp_init_attr.cap.max_send_wr  = 100;
562         qp_init_attr.cap.max_recv_wr  = 100;
563         qp_init_attr.cap.max_send_sge = 2;
564         qp_init_attr.cap.max_recv_sge = 1;
565         qp_init_attr.qp_type          = IB_QPT_GSI;
566         qp_init_attr.port_num         = port;
567         qp_init_attr.qp_context       = NULL;
568         qp_init_attr.event_handler    = NULL;
569         qp_init_attr.srq              = NULL;
570
571         ibqp = ib_create_qp(&shca->pd->ib_pd, &qp_init_attr);
572         if (IS_ERR(ibqp)) {
573                 ehca_err(&shca->ib_device, "Cannot create AQP1 QP.");
574                 ret = PTR_ERR(ibqp);
575                 goto create_aqp1;
576         }
577         sport->ibqp_sqp[IB_QPT_GSI] = ibqp;
578
579         return 0;
580
581 create_aqp1:
582         ib_destroy_cq(sport->ibcq_aqp1);
583         return ret;
584 }
585
586 static int ehca_destroy_aqp1(struct ehca_sport *sport)
587 {
588         int ret;
589
590         ret = ib_destroy_qp(sport->ibqp_sqp[IB_QPT_GSI]);
591         if (ret) {
592                 ehca_gen_err("Cannot destroy AQP1 QP. ret=%i", ret);
593                 return ret;
594         }
595
596         ret = ib_destroy_cq(sport->ibcq_aqp1);
597         if (ret)
598                 ehca_gen_err("Cannot destroy AQP1 CQ. ret=%i", ret);
599
600         return ret;
601 }
602
603 static ssize_t ehca_show_debug_level(struct device_driver *ddp, char *buf)
604 {
605         return snprintf(buf, PAGE_SIZE, "%d\n", ehca_debug_level);
606 }
607
608 static ssize_t ehca_store_debug_level(struct device_driver *ddp,
609                                       const char *buf, size_t count)
610 {
611         int value = (*buf) - '0';
612         if (value >= 0 && value <= 9)
613                 ehca_debug_level = value;
614         return 1;
615 }
616
617 static DRIVER_ATTR(debug_level, S_IRUSR | S_IWUSR,
618                    ehca_show_debug_level, ehca_store_debug_level);
619
620 static struct attribute *ehca_drv_attrs[] = {
621         &driver_attr_debug_level.attr,
622         NULL
623 };
624
625 static struct attribute_group ehca_drv_attr_grp = {
626         .attrs = ehca_drv_attrs
627 };
628
629 static const struct attribute_group *ehca_drv_attr_groups[] = {
630         &ehca_drv_attr_grp,
631         NULL,
632 };
633
634 #define EHCA_RESOURCE_ATTR(name)                                           \
635 static ssize_t  ehca_show_##name(struct device *dev,                       \
636                                  struct device_attribute *attr,            \
637                                  char *buf)                                \
638 {                                                                          \
639         struct ehca_shca *shca;                                            \
640         struct hipz_query_hca *rblock;                                     \
641         int data;                                                          \
642                                                                            \
643         shca = dev_get_drvdata(dev);                                       \
644                                                                            \
645         rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);                      \
646         if (!rblock) {                                                     \
647                 dev_err(dev, "Can't allocate rblock memory.\n");           \
648                 return 0;                                                  \
649         }                                                                  \
650                                                                            \
651         if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) { \
652                 dev_err(dev, "Can't query device properties\n");           \
653                 ehca_free_fw_ctrlblock(rblock);                            \
654                 return 0;                                                  \
655         }                                                                  \
656                                                                            \
657         data = rblock->name;                                               \
658         ehca_free_fw_ctrlblock(rblock);                                    \
659                                                                            \
660         if ((strcmp(#name, "num_ports") == 0) && (ehca_nr_ports == 1))     \
661                 return snprintf(buf, 256, "1\n");                          \
662         else                                                               \
663                 return snprintf(buf, 256, "%d\n", data);                   \
664                                                                            \
665 }                                                                          \
666 static DEVICE_ATTR(name, S_IRUGO, ehca_show_##name, NULL);
667
668 EHCA_RESOURCE_ATTR(num_ports);
669 EHCA_RESOURCE_ATTR(hw_ver);
670 EHCA_RESOURCE_ATTR(max_eq);
671 EHCA_RESOURCE_ATTR(cur_eq);
672 EHCA_RESOURCE_ATTR(max_cq);
673 EHCA_RESOURCE_ATTR(cur_cq);
674 EHCA_RESOURCE_ATTR(max_qp);
675 EHCA_RESOURCE_ATTR(cur_qp);
676 EHCA_RESOURCE_ATTR(max_mr);
677 EHCA_RESOURCE_ATTR(cur_mr);
678 EHCA_RESOURCE_ATTR(max_mw);
679 EHCA_RESOURCE_ATTR(cur_mw);
680 EHCA_RESOURCE_ATTR(max_pd);
681 EHCA_RESOURCE_ATTR(max_ah);
682
683 static ssize_t ehca_show_adapter_handle(struct device *dev,
684                                         struct device_attribute *attr,
685                                         char *buf)
686 {
687         struct ehca_shca *shca = dev_get_drvdata(dev);
688
689         return sprintf(buf, "%llx\n", shca->ipz_hca_handle.handle);
690
691 }
692 static DEVICE_ATTR(adapter_handle, S_IRUGO, ehca_show_adapter_handle, NULL);
693
694 static struct attribute *ehca_dev_attrs[] = {
695         &dev_attr_adapter_handle.attr,
696         &dev_attr_num_ports.attr,
697         &dev_attr_hw_ver.attr,
698         &dev_attr_max_eq.attr,
699         &dev_attr_cur_eq.attr,
700         &dev_attr_max_cq.attr,
701         &dev_attr_cur_cq.attr,
702         &dev_attr_max_qp.attr,
703         &dev_attr_cur_qp.attr,
704         &dev_attr_max_mr.attr,
705         &dev_attr_cur_mr.attr,
706         &dev_attr_max_mw.attr,
707         &dev_attr_cur_mw.attr,
708         &dev_attr_max_pd.attr,
709         &dev_attr_max_ah.attr,
710         NULL
711 };
712
713 static struct attribute_group ehca_dev_attr_grp = {
714         .attrs = ehca_dev_attrs
715 };
716
717 static int ehca_probe(struct platform_device *dev,
718                       const struct of_device_id *id)
719 {
720         struct ehca_shca *shca;
721         const u64 *handle;
722         struct ib_pd *ibpd;
723         int ret, i, eq_size;
724         unsigned long flags;
725
726         handle = of_get_property(dev->dev.of_node, "ibm,hca-handle", NULL);
727         if (!handle) {
728                 ehca_gen_err("Cannot get eHCA handle for adapter: %s.",
729                              dev->dev.of_node->full_name);
730                 return -ENODEV;
731         }
732
733         if (!(*handle)) {
734                 ehca_gen_err("Wrong eHCA handle for adapter: %s.",
735                              dev->dev.of_node->full_name);
736                 return -ENODEV;
737         }
738
739         shca = (struct ehca_shca *)ib_alloc_device(sizeof(*shca));
740         if (!shca) {
741                 ehca_gen_err("Cannot allocate shca memory.");
742                 return -ENOMEM;
743         }
744
745         mutex_init(&shca->modify_mutex);
746         atomic_set(&shca->num_cqs, 0);
747         atomic_set(&shca->num_qps, 0);
748         shca->max_num_qps = ehca_max_qp;
749         shca->max_num_cqs = ehca_max_cq;
750
751         for (i = 0; i < ARRAY_SIZE(shca->sport); i++)
752                 spin_lock_init(&shca->sport[i].mod_sqp_lock);
753
754         shca->ofdev = dev;
755         shca->ipz_hca_handle.handle = *handle;
756         dev_set_drvdata(&dev->dev, shca);
757
758         ret = ehca_sense_attributes(shca);
759         if (ret < 0) {
760                 ehca_gen_err("Cannot sense eHCA attributes.");
761                 goto probe1;
762         }
763
764         ret = ehca_init_device(shca);
765         if (ret) {
766                 ehca_gen_err("Cannot init ehca  device struct");
767                 goto probe1;
768         }
769
770         eq_size = 2 * shca->max_num_cqs + 4 * shca->max_num_qps;
771         /* create event queues */
772         ret = ehca_create_eq(shca, &shca->eq, EHCA_EQ, eq_size);
773         if (ret) {
774                 ehca_err(&shca->ib_device, "Cannot create EQ.");
775                 goto probe1;
776         }
777
778         ret = ehca_create_eq(shca, &shca->neq, EHCA_NEQ, 513);
779         if (ret) {
780                 ehca_err(&shca->ib_device, "Cannot create NEQ.");
781                 goto probe3;
782         }
783
784         /* create internal protection domain */
785         ibpd = ehca_alloc_pd(&shca->ib_device, (void *)(-1), NULL);
786         if (IS_ERR(ibpd)) {
787                 ehca_err(&shca->ib_device, "Cannot create internal PD.");
788                 ret = PTR_ERR(ibpd);
789                 goto probe4;
790         }
791
792         shca->pd = container_of(ibpd, struct ehca_pd, ib_pd);
793         shca->pd->ib_pd.device = &shca->ib_device;
794
795         /* create internal max MR */
796         ret = ehca_reg_internal_maxmr(shca, shca->pd, &shca->maxmr);
797
798         if (ret) {
799                 ehca_err(&shca->ib_device, "Cannot create internal MR ret=%i",
800                          ret);
801                 goto probe5;
802         }
803
804         ret = ib_register_device(&shca->ib_device, NULL);
805         if (ret) {
806                 ehca_err(&shca->ib_device,
807                          "ib_register_device() failed ret=%i", ret);
808                 goto probe6;
809         }
810
811         /* create AQP1 for port 1 */
812         if (ehca_open_aqp1 == 1) {
813                 shca->sport[0].port_state = IB_PORT_DOWN;
814                 ret = ehca_create_aqp1(shca, 1);
815                 if (ret) {
816                         ehca_err(&shca->ib_device,
817                                  "Cannot create AQP1 for port 1.");
818                         goto probe7;
819                 }
820         }
821
822         /* create AQP1 for port 2 */
823         if ((ehca_open_aqp1 == 1) && (shca->num_ports == 2)) {
824                 shca->sport[1].port_state = IB_PORT_DOWN;
825                 ret = ehca_create_aqp1(shca, 2);
826                 if (ret) {
827                         ehca_err(&shca->ib_device,
828                                  "Cannot create AQP1 for port 2.");
829                         goto probe8;
830                 }
831         }
832
833         ret = sysfs_create_group(&dev->dev.kobj, &ehca_dev_attr_grp);
834         if (ret) /* only complain; we can live without attributes */
835                 ehca_err(&shca->ib_device,
836                          "Cannot create device attributes  ret=%d", ret);
837
838         spin_lock_irqsave(&shca_list_lock, flags);
839         list_add(&shca->shca_list, &shca_list);
840         spin_unlock_irqrestore(&shca_list_lock, flags);
841
842         return 0;
843
844 probe8:
845         ret = ehca_destroy_aqp1(&shca->sport[0]);
846         if (ret)
847                 ehca_err(&shca->ib_device,
848                          "Cannot destroy AQP1 for port 1. ret=%i", ret);
849
850 probe7:
851         ib_unregister_device(&shca->ib_device);
852
853 probe6:
854         ret = ehca_dereg_internal_maxmr(shca);
855         if (ret)
856                 ehca_err(&shca->ib_device,
857                          "Cannot destroy internal MR. ret=%x", ret);
858
859 probe5:
860         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
861         if (ret)
862                 ehca_err(&shca->ib_device,
863                          "Cannot destroy internal PD. ret=%x", ret);
864
865 probe4:
866         ret = ehca_destroy_eq(shca, &shca->neq);
867         if (ret)
868                 ehca_err(&shca->ib_device,
869                          "Cannot destroy NEQ. ret=%x", ret);
870
871 probe3:
872         ret = ehca_destroy_eq(shca, &shca->eq);
873         if (ret)
874                 ehca_err(&shca->ib_device,
875                          "Cannot destroy EQ. ret=%x", ret);
876
877 probe1:
878         ib_dealloc_device(&shca->ib_device);
879
880         return -EINVAL;
881 }
882
883 static int ehca_remove(struct platform_device *dev)
884 {
885         struct ehca_shca *shca = dev_get_drvdata(&dev->dev);
886         unsigned long flags;
887         int ret;
888
889         sysfs_remove_group(&dev->dev.kobj, &ehca_dev_attr_grp);
890
891         if (ehca_open_aqp1 == 1) {
892                 int i;
893                 for (i = 0; i < shca->num_ports; i++) {
894                         ret = ehca_destroy_aqp1(&shca->sport[i]);
895                         if (ret)
896                                 ehca_err(&shca->ib_device,
897                                          "Cannot destroy AQP1 for port %x "
898                                          "ret=%i", ret, i);
899                 }
900         }
901
902         ib_unregister_device(&shca->ib_device);
903
904         ret = ehca_dereg_internal_maxmr(shca);
905         if (ret)
906                 ehca_err(&shca->ib_device,
907                          "Cannot destroy internal MR. ret=%i", ret);
908
909         ret = ehca_dealloc_pd(&shca->pd->ib_pd);
910         if (ret)
911                 ehca_err(&shca->ib_device,
912                          "Cannot destroy internal PD. ret=%i", ret);
913
914         ret = ehca_destroy_eq(shca, &shca->eq);
915         if (ret)
916                 ehca_err(&shca->ib_device, "Cannot destroy EQ. ret=%i", ret);
917
918         ret = ehca_destroy_eq(shca, &shca->neq);
919         if (ret)
920                 ehca_err(&shca->ib_device, "Canot destroy NEQ. ret=%i", ret);
921
922         ib_dealloc_device(&shca->ib_device);
923
924         spin_lock_irqsave(&shca_list_lock, flags);
925         list_del(&shca->shca_list);
926         spin_unlock_irqrestore(&shca_list_lock, flags);
927
928         return ret;
929 }
930
931 static struct of_device_id ehca_device_table[] =
932 {
933         {
934                 .name       = "lhca",
935                 .compatible = "IBM,lhca",
936         },
937         {},
938 };
939 MODULE_DEVICE_TABLE(of, ehca_device_table);
940
941 static struct of_platform_driver ehca_driver = {
942         .probe       = ehca_probe,
943         .remove      = ehca_remove,
944         .driver = {
945                 .name = "ehca",
946                 .owner = THIS_MODULE,
947                 .groups = ehca_drv_attr_groups,
948                 .of_match_table = ehca_device_table,
949         },
950 };
951
952 void ehca_poll_eqs(unsigned long data)
953 {
954         struct ehca_shca *shca;
955
956         spin_lock(&shca_list_lock);
957         list_for_each_entry(shca, &shca_list, shca_list) {
958                 if (shca->eq.is_initialized) {
959                         /* call deadman proc only if eq ptr does not change */
960                         struct ehca_eq *eq = &shca->eq;
961                         int max = 3;
962                         volatile u64 q_ofs, q_ofs2;
963                         unsigned long flags;
964                         spin_lock_irqsave(&eq->spinlock, flags);
965                         q_ofs = eq->ipz_queue.current_q_offset;
966                         spin_unlock_irqrestore(&eq->spinlock, flags);
967                         do {
968                                 spin_lock_irqsave(&eq->spinlock, flags);
969                                 q_ofs2 = eq->ipz_queue.current_q_offset;
970                                 spin_unlock_irqrestore(&eq->spinlock, flags);
971                                 max--;
972                         } while (q_ofs == q_ofs2 && max > 0);
973                         if (q_ofs == q_ofs2)
974                                 ehca_process_eq(shca, 0);
975                 }
976         }
977         mod_timer(&poll_eqs_timer, round_jiffies(jiffies + HZ));
978         spin_unlock(&shca_list_lock);
979 }
980
981 static int ehca_mem_notifier(struct notifier_block *nb,
982                              unsigned long action, void *data)
983 {
984         static unsigned long ehca_dmem_warn_time;
985         unsigned long flags;
986
987         switch (action) {
988         case MEM_CANCEL_OFFLINE:
989         case MEM_CANCEL_ONLINE:
990         case MEM_ONLINE:
991         case MEM_OFFLINE:
992                 return NOTIFY_OK;
993         case MEM_GOING_ONLINE:
994         case MEM_GOING_OFFLINE:
995                 /* only ok if no hca is attached to the lpar */
996                 spin_lock_irqsave(&shca_list_lock, flags);
997                 if (list_empty(&shca_list)) {
998                         spin_unlock_irqrestore(&shca_list_lock, flags);
999                         return NOTIFY_OK;
1000                 } else {
1001                         spin_unlock_irqrestore(&shca_list_lock, flags);
1002                         if (printk_timed_ratelimit(&ehca_dmem_warn_time,
1003                                                    30 * 1000))
1004                                 ehca_gen_err("DMEM operations are not allowed"
1005                                              "in conjunction with eHCA");
1006                         return NOTIFY_BAD;
1007                 }
1008         }
1009         return NOTIFY_OK;
1010 }
1011
1012 static struct notifier_block ehca_mem_nb = {
1013         .notifier_call = ehca_mem_notifier,
1014 };
1015
1016 static int __init ehca_module_init(void)
1017 {
1018         int ret;
1019
1020         printk(KERN_INFO "eHCA Infiniband Device Driver "
1021                "(Version " HCAD_VERSION ")\n");
1022
1023         ret = ehca_create_comp_pool();
1024         if (ret) {
1025                 ehca_gen_err("Cannot create comp pool.");
1026                 return ret;
1027         }
1028
1029         ret = ehca_create_slab_caches();
1030         if (ret) {
1031                 ehca_gen_err("Cannot create SLAB caches");
1032                 ret = -ENOMEM;
1033                 goto module_init1;
1034         }
1035
1036         ret = ehca_create_busmap();
1037         if (ret) {
1038                 ehca_gen_err("Cannot create busmap.");
1039                 goto module_init2;
1040         }
1041
1042         ret = ibmebus_register_driver(&ehca_driver);
1043         if (ret) {
1044                 ehca_gen_err("Cannot register eHCA device driver");
1045                 ret = -EINVAL;
1046                 goto module_init3;
1047         }
1048
1049         ret = register_memory_notifier(&ehca_mem_nb);
1050         if (ret) {
1051                 ehca_gen_err("Failed registering memory add/remove notifier");
1052                 goto module_init4;
1053         }
1054
1055         if (ehca_poll_all_eqs != 1) {
1056                 ehca_gen_err("WARNING!!!");
1057                 ehca_gen_err("It is possible to lose interrupts.");
1058         } else {
1059                 init_timer(&poll_eqs_timer);
1060                 poll_eqs_timer.function = ehca_poll_eqs;
1061                 poll_eqs_timer.expires = jiffies + HZ;
1062                 add_timer(&poll_eqs_timer);
1063         }
1064
1065         return 0;
1066
1067 module_init4:
1068         ibmebus_unregister_driver(&ehca_driver);
1069
1070 module_init3:
1071         ehca_destroy_busmap();
1072
1073 module_init2:
1074         ehca_destroy_slab_caches();
1075
1076 module_init1:
1077         ehca_destroy_comp_pool();
1078         return ret;
1079 };
1080
1081 static void __exit ehca_module_exit(void)
1082 {
1083         if (ehca_poll_all_eqs == 1)
1084                 del_timer_sync(&poll_eqs_timer);
1085
1086         ibmebus_unregister_driver(&ehca_driver);
1087
1088         unregister_memory_notifier(&ehca_mem_nb);
1089
1090         ehca_destroy_busmap();
1091
1092         ehca_destroy_slab_caches();
1093
1094         ehca_destroy_comp_pool();
1095
1096         idr_destroy(&ehca_cq_idr);
1097         idr_destroy(&ehca_qp_idr);
1098 };
1099
1100 module_init(ehca_module_init);
1101 module_exit(ehca_module_exit);