linux/drivers/infiniband/hw/ehca/ehca_main.c
<<
>>
Prefs
   1/*
   2 *  IBM eServer eHCA Infiniband device driver for Linux on POWER
   3 *
   4 *  module start stop, hca detection
   5 *
   6 *  Authors: Heiko J Schick <schickhj@de.ibm.com>
   7 *           Hoang-Nam Nguyen <hnguyen@de.ibm.com>
   8 *           Joachim Fenkes <fenkes@de.ibm.com>
   9 *
  10 *  Copyright (c) 2005 IBM Corporation
  11 *
  12 *  All rights reserved.
  13 *
  14 *  This source code is distributed under a dual license of GPL v2.0 and OpenIB
  15 *  BSD.
  16 *
  17 * OpenIB BSD License
  18 *
  19 * Redistribution and use in source and binary forms, with or without
  20 * modification, are permitted provided that the following conditions are met:
  21 *
  22 * Redistributions of source code must retain the above copyright notice, this
  23 * list of conditions and the following disclaimer.
  24 *
  25 * Redistributions in binary form must reproduce the above copyright notice,
  26 * this list of conditions and the following disclaimer in the documentation
  27 * and/or other materials
  28 * provided with the distribution.
  29 *
  30 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  31 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  32 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  33 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  34 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  35 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  36 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
  37 * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
  38 * IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  39 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  40 * POSSIBILITY OF SUCH DAMAGE.
  41 */
  42
  43#ifdef CONFIG_PPC_64K_PAGES
  44#include <linux/slab.h>
  45#endif
  46
  47#include <linux/notifier.h>
  48#include <linux/memory.h>
  49#include "ehca_classes.h"
  50#include "ehca_iverbs.h"
  51#include "ehca_mrmw.h"
  52#include "ehca_tools.h"
  53#include "hcp_if.h"
  54
  55#define HCAD_VERSION "0029"
  56
  57MODULE_LICENSE("Dual BSD/GPL");
  58MODULE_AUTHOR("Christoph Raisch <raisch@de.ibm.com>");
  59MODULE_DESCRIPTION("IBM eServer HCA InfiniBand Device Driver");
  60MODULE_VERSION(HCAD_VERSION);
  61
  62static int ehca_open_aqp1     = 0;
  63static int ehca_hw_level      = 0;
  64static int ehca_poll_all_eqs  = 1;
  65
  66int ehca_debug_level   = 0;
  67int ehca_nr_ports      = -1;
  68int ehca_use_hp_mr     = 0;
  69int ehca_port_act_time = 30;
  70int ehca_static_rate   = -1;
  71int ehca_scaling_code  = 0;
  72int ehca_lock_hcalls   = -1;
  73int ehca_max_cq        = -1;
  74int ehca_max_qp        = -1;
  75
  76module_param_named(open_aqp1,     ehca_open_aqp1,     bool, S_IRUGO);
  77module_param_named(debug_level,   ehca_debug_level,   int,  S_IRUGO);
  78module_param_named(hw_level,      ehca_hw_level,      int,  S_IRUGO);
  79module_param_named(nr_ports,      ehca_nr_ports,      int,  S_IRUGO);
  80module_param_named(use_hp_mr,     ehca_use_hp_mr,     bool, S_IRUGO);
  81module_param_named(port_act_time, ehca_port_act_time, int,  S_IRUGO);
  82module_param_named(poll_all_eqs,  ehca_poll_all_eqs,  bool, S_IRUGO);
  83module_param_named(static_rate,   ehca_static_rate,   int,  S_IRUGO);
  84module_param_named(scaling_code,  ehca_scaling_code,  bool, S_IRUGO);
  85module_param_named(lock_hcalls,   ehca_lock_hcalls,   bool, S_IRUGO);
  86module_param_named(number_of_cqs, ehca_max_cq,        int,  S_IRUGO);
  87module_param_named(number_of_qps, ehca_max_qp,        int,  S_IRUGO);
  88
  89MODULE_PARM_DESC(open_aqp1,
  90                 "Open AQP1 on startup (default: no)");
  91MODULE_PARM_DESC(debug_level,
  92                 "Amount of debug output (0: none (default), 1: traces, "
  93                 "2: some dumps, 3: lots)");
  94MODULE_PARM_DESC(hw_level,
  95                 "Hardware level (0: autosensing (default), "
  96                 "0x10..0x14: eHCA, 0x20..0x23: eHCA2)");
  97MODULE_PARM_DESC(nr_ports,
  98                 "number of connected ports (-1: autodetect (default), "
  99                 "1: port one only, 2: two ports)");
 100MODULE_PARM_DESC(use_hp_mr,
 101                 "Use high performance MRs (default: no)");
 102MODULE_PARM_DESC(port_act_time,
 103                 "Time to wait for port activation (default: 30 sec)");
 104MODULE_PARM_DESC(poll_all_eqs,
 105                 "Poll all event queues periodically (default: yes)");
 106MODULE_PARM_DESC(static_rate,
 107                 "Set permanent static rate (default: no static rate)");
 108MODULE_PARM_DESC(scaling_code,
 109                 "Enable scaling code (default: no)");
 110MODULE_PARM_DESC(lock_hcalls,
 111                 "Serialize all hCalls made by the driver "
 112                 "(default: autodetect)");
 113MODULE_PARM_DESC(number_of_cqs,
 114                "Max number of CQs which can be allocated "
 115                "(default: autodetect)");
 116MODULE_PARM_DESC(number_of_qps,
 117                "Max number of QPs which can be allocated "
 118                "(default: autodetect)");
 119
 120DEFINE_RWLOCK(ehca_qp_idr_lock);
 121DEFINE_RWLOCK(ehca_cq_idr_lock);
 122DEFINE_IDR(ehca_qp_idr);
 123DEFINE_IDR(ehca_cq_idr);
 124
 125static LIST_HEAD(shca_list); /* list of all registered ehcas */
 126static DEFINE_SPINLOCK(shca_list_lock);
 127
 128static struct timer_list poll_eqs_timer;
 129
 130#ifdef CONFIG_PPC_64K_PAGES
 131static struct kmem_cache *ctblk_cache;
 132
 133void *ehca_alloc_fw_ctrlblock(gfp_t flags)
 134{
 135        void *ret = kmem_cache_zalloc(ctblk_cache, flags);
 136        if (!ret)
 137                ehca_gen_err("Out of memory for ctblk");
 138        return ret;
 139}
 140
 141void ehca_free_fw_ctrlblock(void *ptr)
 142{
 143        if (ptr)
 144                kmem_cache_free(ctblk_cache, ptr);
 145
 146}
 147#endif
 148
 149int ehca2ib_return_code(u64 ehca_rc)
 150{
 151        switch (ehca_rc) {
 152        case H_SUCCESS:
 153                return 0;
 154        case H_RESOURCE:             /* Resource in use */
 155        case H_BUSY:
 156                return -EBUSY;
 157        case H_NOT_ENOUGH_RESOURCES: /* insufficient resources */
 158        case H_CONSTRAINED:          /* resource constraint */
 159        case H_NO_MEM:
 160                return -ENOMEM;
 161        default:
 162                return -EINVAL;
 163        }
 164}
 165
 166static int ehca_create_slab_caches(void)
 167{
 168        int ret;
 169
 170        ret = ehca_init_pd_cache();
 171        if (ret) {
 172                ehca_gen_err("Cannot create PD SLAB cache.");
 173                return ret;
 174        }
 175
 176        ret = ehca_init_cq_cache();
 177        if (ret) {
 178                ehca_gen_err("Cannot create CQ SLAB cache.");
 179                goto create_slab_caches2;
 180        }
 181
 182        ret = ehca_init_qp_cache();
 183        if (ret) {
 184                ehca_gen_err("Cannot create QP SLAB cache.");
 185                goto create_slab_caches3;
 186        }
 187
 188        ret = ehca_init_av_cache();
 189        if (ret) {
 190                ehca_gen_err("Cannot create AV SLAB cache.");
 191                goto create_slab_caches4;
 192        }
 193
 194        ret = ehca_init_mrmw_cache();
 195        if (ret) {
 196                ehca_gen_err("Cannot create MR&MW SLAB cache.");
 197                goto create_slab_caches5;
 198        }
 199
 200        ret = ehca_init_small_qp_cache();
 201        if (ret) {
 202                ehca_gen_err("Cannot create small queue SLAB cache.");
 203                goto create_slab_caches6;
 204        }
 205
 206#ifdef CONFIG_PPC_64K_PAGES
 207        ctblk_cache = kmem_cache_create("ehca_cache_ctblk",
 208                                        EHCA_PAGESIZE, H_CB_ALIGNMENT,
 209                                        SLAB_HWCACHE_ALIGN,
 210                                        NULL);
 211        if (!ctblk_cache) {
 212                ehca_gen_err("Cannot create ctblk SLAB cache.");
 213                ehca_cleanup_small_qp_cache();
 214                goto create_slab_caches6;
 215        }
 216#endif
 217        return 0;
 218
 219create_slab_caches6:
 220        ehca_cleanup_mrmw_cache();
 221
 222create_slab_caches5:
 223        ehca_cleanup_av_cache();
 224
 225create_slab_caches4:
 226        ehca_cleanup_qp_cache();
 227
 228create_slab_caches3:
 229        ehca_cleanup_cq_cache();
 230
 231create_slab_caches2:
 232        ehca_cleanup_pd_cache();
 233
 234        return ret;
 235}
 236
 237static void ehca_destroy_slab_caches(void)
 238{
 239        ehca_cleanup_small_qp_cache();
 240        ehca_cleanup_mrmw_cache();
 241        ehca_cleanup_av_cache();
 242        ehca_cleanup_qp_cache();
 243        ehca_cleanup_cq_cache();
 244        ehca_cleanup_pd_cache();
 245#ifdef CONFIG_PPC_64K_PAGES
 246        if (ctblk_cache)
 247                kmem_cache_destroy(ctblk_cache);
 248#endif
 249}
 250
 251#define EHCA_HCAAVER  EHCA_BMASK_IBM(32, 39)
 252#define EHCA_REVID    EHCA_BMASK_IBM(40, 63)
 253
 254static struct cap_descr {
 255        u64 mask;
 256        char *descr;
 257} hca_cap_descr[] = {
 258        { HCA_CAP_AH_PORT_NR_CHECK, "HCA_CAP_AH_PORT_NR_CHECK" },
 259        { HCA_CAP_ATOMIC, "HCA_CAP_ATOMIC" },
 260        { HCA_CAP_AUTO_PATH_MIG, "HCA_CAP_AUTO_PATH_MIG" },
 261        { HCA_CAP_BAD_P_KEY_CTR, "HCA_CAP_BAD_P_KEY_CTR" },
 262        { HCA_CAP_SQD_RTS_PORT_CHANGE, "HCA_CAP_SQD_RTS_PORT_CHANGE" },
 263        { HCA_CAP_CUR_QP_STATE_MOD, "HCA_CAP_CUR_QP_STATE_MOD" },
 264        { HCA_CAP_INIT_TYPE, "HCA_CAP_INIT_TYPE" },
 265        { HCA_CAP_PORT_ACTIVE_EVENT, "HCA_CAP_PORT_ACTIVE_EVENT" },
 266        { HCA_CAP_Q_KEY_VIOL_CTR, "HCA_CAP_Q_KEY_VIOL_CTR" },
 267        { HCA_CAP_WQE_RESIZE, "HCA_CAP_WQE_RESIZE" },
 268        { HCA_CAP_RAW_PACKET_MCAST, "HCA_CAP_RAW_PACKET_MCAST" },
 269        { HCA_CAP_SHUTDOWN_PORT, "HCA_CAP_SHUTDOWN_PORT" },
 270        { HCA_CAP_RC_LL_QP, "HCA_CAP_RC_LL_QP" },
 271        { HCA_CAP_SRQ, "HCA_CAP_SRQ" },
 272        { HCA_CAP_UD_LL_QP, "HCA_CAP_UD_LL_QP" },
 273        { HCA_CAP_RESIZE_MR, "HCA_CAP_RESIZE_MR" },
 274        { HCA_CAP_MINI_QP, "HCA_CAP_MINI_QP" },
 275        { HCA_CAP_H_ALLOC_RES_SYNC, "HCA_CAP_H_ALLOC_RES_SYNC" },
 276};
 277
 278static int ehca_sense_attributes(struct ehca_shca *shca)
 279{
 280        int i, ret = 0;
 281        u64 h_ret;
 282        struct hipz_query_hca *rblock;
 283        struct hipz_query_port *port;
 284        const char *loc_code;
 285
 286        static const u32 pgsize_map[] = {
 287                HCA_CAP_MR_PGSIZE_4K,  0x1000,
 288                HCA_CAP_MR_PGSIZE_64K, 0x10000,
 289                HCA_CAP_MR_PGSIZE_1M,  0x100000,
 290                HCA_CAP_MR_PGSIZE_16M, 0x1000000,
 291        };
 292
 293        ehca_gen_dbg("Probing adapter %s...",
 294                     shca->ofdev->node->full_name);
 295        loc_code = of_get_property(shca->ofdev->node, "ibm,loc-code", NULL);
 296        if (loc_code)
 297                ehca_gen_dbg(" ... location lode=%s", loc_code);
 298
 299        rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
 300        if (!rblock) {
 301                ehca_gen_err("Cannot allocate rblock memory.");
 302                return -ENOMEM;
 303        }
 304
 305        h_ret = hipz_h_query_hca(shca->ipz_hca_handle, rblock);
 306        if (h_ret != H_SUCCESS) {
 307                ehca_gen_err("Cannot query device properties. h_ret=%lli",
 308                             h_ret);
 309                ret = -EPERM;
 310                goto sense_attributes1;
 311        }
 312
 313        if (ehca_nr_ports == 1)
 314                shca->num_ports = 1;
 315        else
 316                shca->num_ports = (u8)rblock->num_ports;
 317
 318        ehca_gen_dbg(" ... found %x ports", rblock->num_ports);
 319
 320        if (ehca_hw_level == 0) {
 321                u32 hcaaver;
 322                u32 revid;
 323
 324                hcaaver = EHCA_BMASK_GET(EHCA_HCAAVER, rblock->hw_ver);
 325                revid   = EHCA_BMASK_GET(EHCA_REVID, rblock->hw_ver);
 326
 327                ehca_gen_dbg(" ... hardware version=%x:%x", hcaaver, revid);
 328
 329                if (hcaaver == 1) {
 330                        if (revid <= 3)
 331                                shca->hw_level = 0x10 | (revid + 1);
 332                        else
 333                                shca->hw_level = 0x14;
 334                } else if (hcaaver == 2) {
 335                        if (revid == 0)
 336                                shca->hw_level = 0x21;
 337                        else if (revid == 0x10)
 338                                shca->hw_level = 0x22;
 339                        else if (revid == 0x20 || revid == 0x21)
 340                                shca->hw_level = 0x23;
 341                }
 342
 343                if (!shca->hw_level) {
 344                        ehca_gen_warn("unknown hardware version"
 345                                      " - assuming default level");
 346                        shca->hw_level = 0x22;
 347                }
 348        } else
 349                shca->hw_level = ehca_hw_level;
 350        ehca_gen_dbg(" ... hardware level=%x", shca->hw_level);
 351
 352        shca->hca_cap = rblock->hca_cap_indicators;
 353        ehca_gen_dbg(" ... HCA capabilities:");
 354        for (i = 0; i < ARRAY_SIZE(hca_cap_descr); i++)
 355                if (EHCA_BMASK_GET(hca_cap_descr[i].mask, shca->hca_cap))
 356                        ehca_gen_dbg("   %s", hca_cap_descr[i].descr);
 357
 358        /* Autodetect hCall locking -- the "H_ALLOC_RESOURCE synced" flag is
 359         * a firmware property, so it's valid across all adapters
 360         */
 361        if (ehca_lock_hcalls == -1)
 362                ehca_lock_hcalls = !(shca->hca_cap & HCA_CAP_H_ALLOC_RES_SYNC);
 363
 364        /* translate supported MR page sizes; always support 4K */
 365        shca->hca_cap_mr_pgsize = EHCA_PAGESIZE;
 366        for (i = 0; i < ARRAY_SIZE(pgsize_map); i += 2)
 367                if (rblock->memory_page_size_supported & pgsize_map[i])
 368                        shca->hca_cap_mr_pgsize |= pgsize_map[i + 1];
 369
 370        /* Set maximum number of CQs and QPs to calculate EQ size */
 371        if (shca->max_num_qps == -1)
 372                shca->max_num_qps = min_t(int, rblock->max_qp,
 373                                          EHCA_MAX_NUM_QUEUES);
 374        else if (shca->max_num_qps < 1 || shca->max_num_qps > rblock->max_qp) {
 375                ehca_gen_warn("The requested number of QPs is out of range "
 376                              "(1 - %i) specified by HW. Value is set to %i",
 377                              rblock->max_qp, rblock->max_qp);
 378                shca->max_num_qps = rblock->max_qp;
 379        }
 380
 381        if (shca->max_num_cqs == -1)
 382                shca->max_num_cqs = min_t(int, rblock->max_cq,
 383                                          EHCA_MAX_NUM_QUEUES);
 384        else if (shca->max_num_cqs < 1 || shca->max_num_cqs > rblock->max_cq) {
 385                ehca_gen_warn("The requested number of CQs is out of range "
 386                              "(1 - %i) specified by HW. Value is set to %i",
 387                              rblock->max_cq, rblock->max_cq);
 388        }
 389
 390        /* query max MTU from first port -- it's the same for all ports */
 391        port = (struct hipz_query_port *)rblock;
 392        h_ret = hipz_h_query_port(shca->ipz_hca_handle, 1, port);
 393        if (h_ret != H_SUCCESS) {
 394                ehca_gen_err("Cannot query port properties. h_ret=%lli",
 395                             h_ret);
 396                ret = -EPERM;
 397                goto sense_attributes1;
 398        }
 399
 400        shca->max_mtu = port->max_mtu;
 401
 402sense_attributes1:
 403        ehca_free_fw_ctrlblock(rblock);
 404        return ret;
 405}
 406
 407static int init_node_guid(struct ehca_shca *shca)
 408{
 409        int ret = 0;
 410        struct hipz_query_hca *rblock;
 411
 412        rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);
 413        if (!rblock) {
 414                ehca_err(&shca->ib_device, "Can't allocate rblock memory.");
 415                return -ENOMEM;
 416        }
 417
 418        if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) {
 419                ehca_err(&shca->ib_device, "Can't query device properties");
 420                ret = -EINVAL;
 421                goto init_node_guid1;
 422        }
 423
 424        memcpy(&shca->ib_device.node_guid, &rblock->node_guid, sizeof(u64));
 425
 426init_node_guid1:
 427        ehca_free_fw_ctrlblock(rblock);
 428        return ret;
 429}
 430
 431static int ehca_init_device(struct ehca_shca *shca)
 432{
 433        int ret;
 434
 435        ret = init_node_guid(shca);
 436        if (ret)
 437                return ret;
 438
 439        strlcpy(shca->ib_device.name, "ehca%d", IB_DEVICE_NAME_MAX);
 440        shca->ib_device.owner               = THIS_MODULE;
 441
 442        shca->ib_device.uverbs_abi_ver      = 8;
 443        shca->ib_device.uverbs_cmd_mask     =
 444                (1ull << IB_USER_VERBS_CMD_GET_CONTEXT)         |
 445                (1ull << IB_USER_VERBS_CMD_QUERY_DEVICE)        |
 446                (1ull << IB_USER_VERBS_CMD_QUERY_PORT)          |
 447                (1ull << IB_USER_VERBS_CMD_ALLOC_PD)            |
 448                (1ull << IB_USER_VERBS_CMD_DEALLOC_PD)          |
 449                (1ull << IB_USER_VERBS_CMD_REG_MR)              |
 450                (1ull << IB_USER_VERBS_CMD_DEREG_MR)            |
 451                (1ull << IB_USER_VERBS_CMD_CREATE_COMP_CHANNEL) |
 452                (1ull << IB_USER_VERBS_CMD_CREATE_CQ)           |
 453                (1ull << IB_USER_VERBS_CMD_DESTROY_CQ)          |
 454                (1ull << IB_USER_VERBS_CMD_CREATE_QP)           |
 455                (1ull << IB_USER_VERBS_CMD_MODIFY_QP)           |
 456                (1ull << IB_USER_VERBS_CMD_QUERY_QP)            |
 457                (1ull << IB_USER_VERBS_CMD_DESTROY_QP)          |
 458                (1ull << IB_USER_VERBS_CMD_ATTACH_MCAST)        |
 459                (1ull << IB_USER_VERBS_CMD_DETACH_MCAST);
 460
 461        shca->ib_device.node_type           = RDMA_NODE_IB_CA;
 462        shca->ib_device.phys_port_cnt       = shca->num_ports;
 463        shca->ib_device.num_comp_vectors    = 1;
 464        shca->ib_device.dma_device          = &shca->ofdev->dev;
 465        shca->ib_device.query_device        = ehca_query_device;
 466        shca->ib_device.query_port          = ehca_query_port;
 467        shca->ib_device.query_gid           = ehca_query_gid;
 468        shca->ib_device.query_pkey          = ehca_query_pkey;
 469        /* shca->in_device.modify_device    = ehca_modify_device    */
 470        shca->ib_device.modify_port         = ehca_modify_port;
 471        shca->ib_device.alloc_ucontext      = ehca_alloc_ucontext;
 472        shca->ib_device.dealloc_ucontext    = ehca_dealloc_ucontext;
 473        shca->ib_device.alloc_pd            = ehca_alloc_pd;
 474        shca->ib_device.dealloc_pd          = ehca_dealloc_pd;
 475        shca->ib_device.create_ah           = ehca_create_ah;
 476        /* shca->ib_device.modify_ah        = ehca_modify_ah;       */
 477        shca->ib_device.query_ah            = ehca_query_ah;
 478        shca->ib_device.destroy_ah          = ehca_destroy_ah;
 479        shca->ib_device.create_qp           = ehca_create_qp;
 480        shca->ib_device.modify_qp           = ehca_modify_qp;
 481        shca->ib_device.query_qp            = ehca_query_qp;
 482        shca->ib_device.destroy_qp          = ehca_destroy_qp;
 483        shca->ib_device.post_send           = ehca_post_send;
 484        shca->ib_device.post_recv           = ehca_post_recv;
 485        shca->ib_device.create_cq           = ehca_create_cq;
 486        shca->ib_device.destroy_cq          = ehca_destroy_cq;
 487        shca->ib_device.resize_cq           = ehca_resize_cq;
 488        shca->ib_device.poll_cq             = ehca_poll_cq;
 489        /* shca->ib_device.peek_cq          = ehca_peek_cq;         */
 490        shca->ib_device.req_notify_cq       = ehca_req_notify_cq;
 491        /* shca->ib_device.req_ncomp_notif  = ehca_req_ncomp_notif; */
 492        shca->ib_device.get_dma_mr          = ehca_get_dma_mr;
 493        shca->ib_device.reg_phys_mr         = ehca_reg_phys_mr;
 494        shca->ib_device.reg_user_mr         = ehca_reg_user_mr;
 495        shca->ib_device.query_mr            = ehca_query_mr;
 496        shca->ib_device.dereg_mr            = ehca_dereg_mr;
 497        shca->ib_device.rereg_phys_mr       = ehca_rereg_phys_mr;
 498        shca->ib_device.alloc_mw            = ehca_alloc_mw;
 499        shca->ib_device.bind_mw             = ehca_bind_mw;
 500        shca->ib_device.dealloc_mw          = ehca_dealloc_mw;
 501        shca->ib_device.alloc_fmr           = ehca_alloc_fmr;
 502        shca->ib_device.map_phys_fmr        = ehca_map_phys_fmr;
 503        shca->ib_device.unmap_fmr           = ehca_unmap_fmr;
 504        shca->ib_device.dealloc_fmr         = ehca_dealloc_fmr;
 505        shca->ib_device.attach_mcast        = ehca_attach_mcast;
 506        shca->ib_device.detach_mcast        = ehca_detach_mcast;
 507        shca->ib_device.process_mad         = ehca_process_mad;
 508        shca->ib_device.mmap                = ehca_mmap;
 509        shca->ib_device.dma_ops             = &ehca_dma_mapping_ops;
 510
 511        if (EHCA_BMASK_GET(HCA_CAP_SRQ, shca->hca_cap)) {
 512                shca->ib_device.uverbs_cmd_mask |=
 513                        (1ull << IB_USER_VERBS_CMD_CREATE_SRQ) |
 514                        (1ull << IB_USER_VERBS_CMD_MODIFY_SRQ) |
 515                        (1ull << IB_USER_VERBS_CMD_QUERY_SRQ) |
 516                        (1ull << IB_USER_VERBS_CMD_DESTROY_SRQ);
 517
 518                shca->ib_device.create_srq          = ehca_create_srq;
 519                shca->ib_device.modify_srq          = ehca_modify_srq;
 520                shca->ib_device.query_srq           = ehca_query_srq;
 521                shca->ib_device.destroy_srq         = ehca_destroy_srq;
 522                shca->ib_device.post_srq_recv       = ehca_post_srq_recv;
 523        }
 524
 525        return ret;
 526}
 527
 528static int ehca_create_aqp1(struct ehca_shca *shca, u32 port)
 529{
 530        struct ehca_sport *sport = &shca->sport[port - 1];
 531        struct ib_cq *ibcq;
 532        struct ib_qp *ibqp;
 533        struct ib_qp_init_attr qp_init_attr;
 534        int ret;
 535
 536        if (sport->ibcq_aqp1) {
 537                ehca_err(&shca->ib_device, "AQP1 CQ is already created.");
 538                return -EPERM;
 539        }
 540
 541        ibcq = ib_create_cq(&shca->ib_device, NULL, NULL, (void *)(-1), 10, 0);
 542        if (IS_ERR(ibcq)) {
 543                ehca_err(&shca->ib_device, "Cannot create AQP1 CQ.");
 544                return PTR_ERR(ibcq);
 545        }
 546        sport->ibcq_aqp1 = ibcq;
 547
 548        if (sport->ibqp_sqp[IB_QPT_GSI]) {
 549                ehca_err(&shca->ib_device, "AQP1 QP is already created.");
 550                ret = -EPERM;
 551                goto create_aqp1;
 552        }
 553
 554        memset(&qp_init_attr, 0, sizeof(struct ib_qp_init_attr));
 555        qp_init_attr.send_cq          = ibcq;
 556        qp_init_attr.recv_cq          = ibcq;
 557        qp_init_attr.sq_sig_type      = IB_SIGNAL_ALL_WR;
 558        qp_init_attr.cap.max_send_wr  = 100;
 559        qp_init_attr.cap.max_recv_wr  = 100;
 560        qp_init_attr.cap.max_send_sge = 2;
 561        qp_init_attr.cap.max_recv_sge = 1;
 562        qp_init_attr.qp_type          = IB_QPT_GSI;
 563        qp_init_attr.port_num         = port;
 564        qp_init_attr.qp_context       = NULL;
 565        qp_init_attr.event_handler    = NULL;
 566        qp_init_attr.srq              = NULL;
 567
 568        ibqp = ib_create_qp(&shca->pd->ib_pd, &qp_init_attr);
 569        if (IS_ERR(ibqp)) {
 570                ehca_err(&shca->ib_device, "Cannot create AQP1 QP.");
 571                ret = PTR_ERR(ibqp);
 572                goto create_aqp1;
 573        }
 574        sport->ibqp_sqp[IB_QPT_GSI] = ibqp;
 575
 576        return 0;
 577
 578create_aqp1:
 579        ib_destroy_cq(sport->ibcq_aqp1);
 580        return ret;
 581}
 582
 583static int ehca_destroy_aqp1(struct ehca_sport *sport)
 584{
 585        int ret;
 586
 587        ret = ib_destroy_qp(sport->ibqp_sqp[IB_QPT_GSI]);
 588        if (ret) {
 589                ehca_gen_err("Cannot destroy AQP1 QP. ret=%i", ret);
 590                return ret;
 591        }
 592
 593        ret = ib_destroy_cq(sport->ibcq_aqp1);
 594        if (ret)
 595                ehca_gen_err("Cannot destroy AQP1 CQ. ret=%i", ret);
 596
 597        return ret;
 598}
 599
 600static ssize_t ehca_show_debug_level(struct device_driver *ddp, char *buf)
 601{
 602        return snprintf(buf, PAGE_SIZE, "%d\n", ehca_debug_level);
 603}
 604
 605static ssize_t ehca_store_debug_level(struct device_driver *ddp,
 606                                      const char *buf, size_t count)
 607{
 608        int value = (*buf) - '0';
 609        if (value >= 0 && value <= 9)
 610                ehca_debug_level = value;
 611        return 1;
 612}
 613
 614static DRIVER_ATTR(debug_level, S_IRUSR | S_IWUSR,
 615                   ehca_show_debug_level, ehca_store_debug_level);
 616
 617static struct attribute *ehca_drv_attrs[] = {
 618        &driver_attr_debug_level.attr,
 619        NULL
 620};
 621
 622static struct attribute_group ehca_drv_attr_grp = {
 623        .attrs = ehca_drv_attrs
 624};
 625
 626static const struct attribute_group *ehca_drv_attr_groups[] = {
 627        &ehca_drv_attr_grp,
 628        NULL,
 629};
 630
 631#define EHCA_RESOURCE_ATTR(name)                                           \
 632static ssize_t  ehca_show_##name(struct device *dev,                       \
 633                                 struct device_attribute *attr,            \
 634                                 char *buf)                                \
 635{                                                                          \
 636        struct ehca_shca *shca;                                            \
 637        struct hipz_query_hca *rblock;                                     \
 638        int data;                                                          \
 639                                                                           \
 640        shca = dev_get_drvdata(dev);                                       \
 641                                                                           \
 642        rblock = ehca_alloc_fw_ctrlblock(GFP_KERNEL);                      \
 643        if (!rblock) {                                                     \
 644                dev_err(dev, "Can't allocate rblock memory.\n");           \
 645                return 0;                                                  \
 646        }                                                                  \
 647                                                                           \
 648        if (hipz_h_query_hca(shca->ipz_hca_handle, rblock) != H_SUCCESS) { \
 649                dev_err(dev, "Can't query device properties\n");           \
 650                ehca_free_fw_ctrlblock(rblock);                            \
 651                return 0;                                                  \
 652        }                                                                  \
 653                                                                           \
 654        data = rblock->name;                                               \
 655        ehca_free_fw_ctrlblock(rblock);                                    \
 656                                                                           \
 657        if ((strcmp(#name, "num_ports") == 0) && (ehca_nr_ports == 1))     \
 658                return snprintf(buf, 256, "1\n");                          \
 659        else                                                               \
 660                return snprintf(buf, 256, "%d\n", data);                   \
 661                                                                           \
 662}                                                                          \
 663static DEVICE_ATTR(name, S_IRUGO, ehca_show_##name, NULL);
 664
 665EHCA_RESOURCE_ATTR(num_ports);
 666EHCA_RESOURCE_ATTR(hw_ver);
 667EHCA_RESOURCE_ATTR(max_eq);
 668EHCA_RESOURCE_ATTR(cur_eq);
 669EHCA_RESOURCE_ATTR(max_cq);
 670EHCA_RESOURCE_ATTR(cur_cq);
 671EHCA_RESOURCE_ATTR(max_qp);
 672EHCA_RESOURCE_ATTR(cur_qp);
 673EHCA_RESOURCE_ATTR(max_mr);
 674EHCA_RESOURCE_ATTR(cur_mr);
 675EHCA_RESOURCE_ATTR(max_mw);
 676EHCA_RESOURCE_ATTR(cur_mw);
 677EHCA_RESOURCE_ATTR(max_pd);
 678EHCA_RESOURCE_ATTR(max_ah);
 679
 680static ssize_t ehca_show_adapter_handle(struct device *dev,
 681                                        struct device_attribute *attr,
 682                                        char *buf)
 683{
 684        struct ehca_shca *shca = dev_get_drvdata(dev);
 685
 686        return sprintf(buf, "%llx\n", shca->ipz_hca_handle.handle);
 687
 688}
 689static DEVICE_ATTR(adapter_handle, S_IRUGO, ehca_show_adapter_handle, NULL);
 690
 691static struct attribute *ehca_dev_attrs[] = {
 692        &dev_attr_adapter_handle.attr,
 693        &dev_attr_num_ports.attr,
 694        &dev_attr_hw_ver.attr,
 695        &dev_attr_max_eq.attr,
 696        &dev_attr_cur_eq.attr,
 697        &dev_attr_max_cq.attr,
 698        &dev_attr_cur_cq.attr,
 699        &dev_attr_max_qp.attr,
 700        &dev_attr_cur_qp.attr,
 701        &dev_attr_max_mr.attr,
 702        &dev_attr_cur_mr.attr,
 703        &dev_attr_max_mw.attr,
 704        &dev_attr_cur_mw.attr,
 705        &dev_attr_max_pd.attr,
 706        &dev_attr_max_ah.attr,
 707        NULL
 708};
 709
 710static struct attribute_group ehca_dev_attr_grp = {
 711        .attrs = ehca_dev_attrs
 712};
 713
 714static int __devinit ehca_probe(struct of_device *dev,
 715                                const struct of_device_id *id)
 716{
 717        struct ehca_shca *shca;
 718        const u64 *handle;
 719        struct ib_pd *ibpd;
 720        int ret, i, eq_size;
 721        unsigned long flags;
 722
 723        handle = of_get_property(dev->node, "ibm,hca-handle", NULL);
 724        if (!handle) {
 725                ehca_gen_err("Cannot get eHCA handle for adapter: %s.",
 726                             dev->node->full_name);
 727                return -ENODEV;
 728        }
 729
 730        if (!(*handle)) {
 731                ehca_gen_err("Wrong eHCA handle for adapter: %s.",
 732                             dev->node->full_name);
 733                return -ENODEV;
 734        }
 735
 736        shca = (struct ehca_shca *)ib_alloc_device(sizeof(*shca));
 737        if (!shca) {
 738                ehca_gen_err("Cannot allocate shca memory.");
 739                return -ENOMEM;
 740        }
 741
 742        mutex_init(&shca->modify_mutex);
 743        atomic_set(&shca->num_cqs, 0);
 744        atomic_set(&shca->num_qps, 0);
 745        shca->max_num_qps = ehca_max_qp;
 746        shca->max_num_cqs = ehca_max_cq;
 747
 748        for (i = 0; i < ARRAY_SIZE(shca->sport); i++)
 749                spin_lock_init(&shca->sport[i].mod_sqp_lock);
 750
 751        shca->ofdev = dev;
 752        shca->ipz_hca_handle.handle = *handle;
 753        dev_set_drvdata(&dev->dev, shca);
 754
 755        ret = ehca_sense_attributes(shca);
 756        if (ret < 0) {
 757                ehca_gen_err("Cannot sense eHCA attributes.");
 758                goto probe1;
 759        }
 760
 761        ret = ehca_init_device(shca);
 762        if (ret) {
 763                ehca_gen_err("Cannot init ehca  device struct");
 764                goto probe1;
 765        }
 766
 767        eq_size = 2 * shca->max_num_cqs + 4 * shca->max_num_qps;
 768        /* create event queues */
 769        ret = ehca_create_eq(shca, &shca->eq, EHCA_EQ, eq_size);
 770        if (ret) {
 771                ehca_err(&shca->ib_device, "Cannot create EQ.");
 772                goto probe1;
 773        }
 774
 775        ret = ehca_create_eq(shca, &shca->neq, EHCA_NEQ, 513);
 776        if (ret) {
 777                ehca_err(&shca->ib_device, "Cannot create NEQ.");
 778                goto probe3;
 779        }
 780
 781        /* create internal protection domain */
 782        ibpd = ehca_alloc_pd(&shca->ib_device, (void *)(-1), NULL);
 783        if (IS_ERR(ibpd)) {
 784                ehca_err(&shca->ib_device, "Cannot create internal PD.");
 785                ret = PTR_ERR(ibpd);
 786                goto probe4;
 787        }
 788
 789        shca->pd = container_of(ibpd, struct ehca_pd, ib_pd);
 790        shca->pd->ib_pd.device = &shca->ib_device;
 791
 792        /* create internal max MR */
 793        ret = ehca_reg_internal_maxmr(shca, shca->pd, &shca->maxmr);
 794
 795        if (ret) {
 796                ehca_err(&shca->ib_device, "Cannot create internal MR ret=%i",
 797                         ret);
 798                goto probe5;
 799        }
 800
 801        ret = ib_register_device(&shca->ib_device);
 802        if (ret) {
 803                ehca_err(&shca->ib_device,
 804                         "ib_register_device() failed ret=%i", ret);
 805                goto probe6;
 806        }
 807
 808        /* create AQP1 for port 1 */
 809        if (ehca_open_aqp1 == 1) {
 810                shca->sport[0].port_state = IB_PORT_DOWN;
 811                ret = ehca_create_aqp1(shca, 1);
 812                if (ret) {
 813                        ehca_err(&shca->ib_device,
 814                                 "Cannot create AQP1 for port 1.");
 815                        goto probe7;
 816                }
 817        }
 818
 819        /* create AQP1 for port 2 */
 820        if ((ehca_open_aqp1 == 1) && (shca->num_ports == 2)) {
 821                shca->sport[1].port_state = IB_PORT_DOWN;
 822                ret = ehca_create_aqp1(shca, 2);
 823                if (ret) {
 824                        ehca_err(&shca->ib_device,
 825                                 "Cannot create AQP1 for port 2.");
 826                        goto probe8;
 827                }
 828        }
 829
 830        ret = sysfs_create_group(&dev->dev.kobj, &ehca_dev_attr_grp);
 831        if (ret) /* only complain; we can live without attributes */
 832                ehca_err(&shca->ib_device,
 833                         "Cannot create device attributes  ret=%d", ret);
 834
 835        spin_lock_irqsave(&shca_list_lock, flags);
 836        list_add(&shca->shca_list, &shca_list);
 837        spin_unlock_irqrestore(&shca_list_lock, flags);
 838
 839        return 0;
 840
 841probe8:
 842        ret = ehca_destroy_aqp1(&shca->sport[0]);
 843        if (ret)
 844                ehca_err(&shca->ib_device,
 845                         "Cannot destroy AQP1 for port 1. ret=%i", ret);
 846
 847probe7:
 848        ib_unregister_device(&shca->ib_device);
 849
 850probe6:
 851        ret = ehca_dereg_internal_maxmr(shca);
 852        if (ret)
 853                ehca_err(&shca->ib_device,
 854                         "Cannot destroy internal MR. ret=%x", ret);
 855
 856probe5:
 857        ret = ehca_dealloc_pd(&shca->pd->ib_pd);
 858        if (ret)
 859                ehca_err(&shca->ib_device,
 860                         "Cannot destroy internal PD. ret=%x", ret);
 861
 862probe4:
 863        ret = ehca_destroy_eq(shca, &shca->neq);
 864        if (ret)
 865                ehca_err(&shca->ib_device,
 866                         "Cannot destroy NEQ. ret=%x", ret);
 867
 868probe3:
 869        ret = ehca_destroy_eq(shca, &shca->eq);
 870        if (ret)
 871                ehca_err(&shca->ib_device,
 872                         "Cannot destroy EQ. ret=%x", ret);
 873
 874probe1:
 875        ib_dealloc_device(&shca->ib_device);
 876
 877        return -EINVAL;
 878}
 879
 880static int __devexit ehca_remove(struct of_device *dev)
 881{
 882        struct ehca_shca *shca = dev_get_drvdata(&dev->dev);
 883        unsigned long flags;
 884        int ret;
 885
 886        sysfs_remove_group(&dev->dev.kobj, &ehca_dev_attr_grp);
 887
 888        if (ehca_open_aqp1 == 1) {
 889                int i;
 890                for (i = 0; i < shca->num_ports; i++) {
 891                        ret = ehca_destroy_aqp1(&shca->sport[i]);
 892                        if (ret)
 893                                ehca_err(&shca->ib_device,
 894                                         "Cannot destroy AQP1 for port %x "
 895                                         "ret=%i", ret, i);
 896                }
 897        }
 898
 899        ib_unregister_device(&shca->ib_device);
 900
 901        ret = ehca_dereg_internal_maxmr(shca);
 902        if (ret)
 903                ehca_err(&shca->ib_device,
 904                         "Cannot destroy internal MR. ret=%i", ret);
 905
 906        ret = ehca_dealloc_pd(&shca->pd->ib_pd);
 907        if (ret)
 908                ehca_err(&shca->ib_device,
 909                         "Cannot destroy internal PD. ret=%i", ret);
 910
 911        ret = ehca_destroy_eq(shca, &shca->eq);
 912        if (ret)
 913                ehca_err(&shca->ib_device, "Cannot destroy EQ. ret=%i", ret);
 914
 915        ret = ehca_destroy_eq(shca, &shca->neq);
 916        if (ret)
 917                ehca_err(&shca->ib_device, "Canot destroy NEQ. ret=%i", ret);
 918
 919        ib_dealloc_device(&shca->ib_device);
 920
 921        spin_lock_irqsave(&shca_list_lock, flags);
 922        list_del(&shca->shca_list);
 923        spin_unlock_irqrestore(&shca_list_lock, flags);
 924
 925        return ret;
 926}
 927
 928static struct of_device_id ehca_device_table[] =
 929{
 930        {
 931                .name       = "lhca",
 932                .compatible = "IBM,lhca",
 933        },
 934        {},
 935};
 936MODULE_DEVICE_TABLE(of, ehca_device_table);
 937
 938static struct of_platform_driver ehca_driver = {
 939        .name        = "ehca",
 940        .match_table = ehca_device_table,
 941        .probe       = ehca_probe,
 942        .remove      = ehca_remove,
 943        .driver      = {
 944                .groups = ehca_drv_attr_groups,
 945        },
 946};
 947
 948void ehca_poll_eqs(unsigned long data)
 949{
 950        struct ehca_shca *shca;
 951
 952        spin_lock(&shca_list_lock);
 953        list_for_each_entry(shca, &shca_list, shca_list) {
 954                if (shca->eq.is_initialized) {
 955                        /* call deadman proc only if eq ptr does not change */
 956                        struct ehca_eq *eq = &shca->eq;
 957                        int max = 3;
 958                        volatile u64 q_ofs, q_ofs2;
 959                        unsigned long flags;
 960                        spin_lock_irqsave(&eq->spinlock, flags);
 961                        q_ofs = eq->ipz_queue.current_q_offset;
 962                        spin_unlock_irqrestore(&eq->spinlock, flags);
 963                        do {
 964                                spin_lock_irqsave(&eq->spinlock, flags);
 965                                q_ofs2 = eq->ipz_queue.current_q_offset;
 966                                spin_unlock_irqrestore(&eq->spinlock, flags);
 967                                max--;
 968                        } while (q_ofs == q_ofs2 && max > 0);
 969                        if (q_ofs == q_ofs2)
 970                                ehca_process_eq(shca, 0);
 971                }
 972        }
 973        mod_timer(&poll_eqs_timer, round_jiffies(jiffies + HZ));
 974        spin_unlock(&shca_list_lock);
 975}
 976
 977static int ehca_mem_notifier(struct notifier_block *nb,
 978                             unsigned long action, void *data)
 979{
 980        static unsigned long ehca_dmem_warn_time;
 981        unsigned long flags;
 982
 983        switch (action) {
 984        case MEM_CANCEL_OFFLINE:
 985        case MEM_CANCEL_ONLINE:
 986        case MEM_ONLINE:
 987        case MEM_OFFLINE:
 988                return NOTIFY_OK;
 989        case MEM_GOING_ONLINE:
 990        case MEM_GOING_OFFLINE:
 991                /* only ok if no hca is attached to the lpar */
 992                spin_lock_irqsave(&shca_list_lock, flags);
 993                if (list_empty(&shca_list)) {
 994                        spin_unlock_irqrestore(&shca_list_lock, flags);
 995                        return NOTIFY_OK;
 996                } else {
 997                        spin_unlock_irqrestore(&shca_list_lock, flags);
 998                        if (printk_timed_ratelimit(&ehca_dmem_warn_time,
 999                                                   30 * 1000))
1000                                ehca_gen_err("DMEM operations are not allowed"
1001                                             "in conjunction with eHCA");
1002                        return NOTIFY_BAD;
1003                }
1004        }
1005        return NOTIFY_OK;
1006}
1007
1008static struct notifier_block ehca_mem_nb = {
1009        .notifier_call = ehca_mem_notifier,
1010};
1011
1012static int __init ehca_module_init(void)
1013{
1014        int ret;
1015
1016        printk(KERN_INFO "eHCA Infiniband Device Driver "
1017               "(Version " HCAD_VERSION ")\n");
1018
1019        ret = ehca_create_comp_pool();
1020        if (ret) {
1021                ehca_gen_err("Cannot create comp pool.");
1022                return ret;
1023        }
1024
1025        ret = ehca_create_slab_caches();
1026        if (ret) {
1027                ehca_gen_err("Cannot create SLAB caches");
1028                ret = -ENOMEM;
1029                goto module_init1;
1030        }
1031
1032        ret = ehca_create_busmap();
1033        if (ret) {
1034                ehca_gen_err("Cannot create busmap.");
1035                goto module_init2;
1036        }
1037
1038        ret = ibmebus_register_driver(&ehca_driver);
1039        if (ret) {
1040                ehca_gen_err("Cannot register eHCA device driver");
1041                ret = -EINVAL;
1042                goto module_init3;
1043        }
1044
1045        ret = register_memory_notifier(&ehca_mem_nb);
1046        if (ret) {
1047                ehca_gen_err("Failed registering memory add/remove notifier");
1048                goto module_init4;
1049        }
1050
1051        if (ehca_poll_all_eqs != 1) {
1052                ehca_gen_err("WARNING!!!");
1053                ehca_gen_err("It is possible to lose interrupts.");
1054        } else {
1055                init_timer(&poll_eqs_timer);
1056                poll_eqs_timer.function = ehca_poll_eqs;
1057                poll_eqs_timer.expires = jiffies + HZ;
1058                add_timer(&poll_eqs_timer);
1059        }
1060
1061        return 0;
1062
1063module_init4:
1064        ibmebus_unregister_driver(&ehca_driver);
1065
1066module_init3:
1067        ehca_destroy_busmap();
1068
1069module_init2:
1070        ehca_destroy_slab_caches();
1071
1072module_init1:
1073        ehca_destroy_comp_pool();
1074        return ret;
1075};
1076
1077static void __exit ehca_module_exit(void)
1078{
1079        if (ehca_poll_all_eqs == 1)
1080                del_timer_sync(&poll_eqs_timer);
1081
1082        ibmebus_unregister_driver(&ehca_driver);
1083
1084        unregister_memory_notifier(&ehca_mem_nb);
1085
1086        ehca_destroy_busmap();
1087
1088        ehca_destroy_slab_caches();
1089
1090        ehca_destroy_comp_pool();
1091
1092        idr_destroy(&ehca_cq_idr);
1093        idr_destroy(&ehca_qp_idr);
1094};
1095
/* hook the init and exit routines into module load/unload */
module_init(ehca_module_init);
module_exit(ehca_module_exit);
1098