linux/drivers/infiniband/hw/qib/qib_driver.c
<<
>>
Prefs
   1/*
   2 * Copyright (c) 2013 Intel Corporation. All rights reserved.
   3 * Copyright (c) 2006, 2007, 2008, 2009 QLogic Corporation. All rights reserved.
   4 * Copyright (c) 2003, 2004, 2005, 2006 PathScale, Inc. All rights reserved.
   5 *
   6 * This software is available to you under a choice of one of two
   7 * licenses.  You may choose to be licensed under the terms of the GNU
   8 * General Public License (GPL) Version 2, available from the file
   9 * COPYING in the main directory of this source tree, or the
  10 * OpenIB.org BSD license below:
  11 *
  12 *     Redistribution and use in source and binary forms, with or
  13 *     without modification, are permitted provided that the following
  14 *     conditions are met:
  15 *
  16 *      - Redistributions of source code must retain the above
  17 *        copyright notice, this list of conditions and the following
  18 *        disclaimer.
  19 *
  20 *      - Redistributions in binary form must reproduce the above
  21 *        copyright notice, this list of conditions and the following
  22 *        disclaimer in the documentation and/or other materials
  23 *        provided with the distribution.
  24 *
  25 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
  26 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  27 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
  28 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
  29 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
  30 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
  31 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  32 * SOFTWARE.
  33 */
  34
  35#include <linux/spinlock.h>
  36#include <linux/pci.h>
  37#include <linux/io.h>
  38#include <linux/delay.h>
  39#include <linux/netdevice.h>
  40#include <linux/vmalloc.h>
  41#include <linux/module.h>
  42#include <linux/prefetch.h>
  43
  44#include "qib.h"
  45
  46/*
  47 * The size has to be longer than this string, so we can append
  48 * board/chip information to it in the init code.
  49 */
  50const char ib_qib_version[] = QIB_DRIVER_VERSION "\n";
  51
  52DEFINE_SPINLOCK(qib_devs_lock);
  53LIST_HEAD(qib_dev_list);
  54DEFINE_MUTEX(qib_mutex);        /* general driver use */
  55
  56unsigned qib_ibmtu;
  57module_param_named(ibmtu, qib_ibmtu, uint, S_IRUGO);
  58MODULE_PARM_DESC(ibmtu, "Set max IB MTU (0=2KB, 1=256, 2=512, ... 5=4096");
  59
  60unsigned qib_compat_ddr_negotiate = 1;
  61module_param_named(compat_ddr_negotiate, qib_compat_ddr_negotiate, uint,
  62                   S_IWUSR | S_IRUGO);
  63MODULE_PARM_DESC(compat_ddr_negotiate,
  64                 "Attempt pre-IBTA 1.2 DDR speed negotiation");
  65
  66MODULE_LICENSE("Dual BSD/GPL");
  67MODULE_AUTHOR("Intel <ibsupport@intel.com>");
  68MODULE_DESCRIPTION("Intel IB driver");
  69MODULE_VERSION(QIB_DRIVER_VERSION);
  70
  71/*
  72 * QIB_PIO_MAXIBHDR is the max IB header size allowed for in our
  73 * PIO send buffers.  This is well beyond anything currently
  74 * defined in the InfiniBand spec.
  75 */
  76#define QIB_PIO_MAXIBHDR 128
  77
  78/*
  79 * QIB_MAX_PKT_RCV is the max # if packets processed per receive interrupt.
  80 */
  81#define QIB_MAX_PKT_RECV 64
  82
  83struct qlogic_ib_stats qib_stats;
  84
  85const char *qib_get_unit_name(int unit)
  86{
  87        static char iname[16];
  88
  89        snprintf(iname, sizeof(iname), "infinipath%u", unit);
  90        return iname;
  91}
  92
  93/*
  94 * Return count of units with at least one port ACTIVE.
  95 */
  96int qib_count_active_units(void)
  97{
  98        struct qib_devdata *dd;
  99        struct qib_pportdata *ppd;
 100        unsigned long flags;
 101        int pidx, nunits_active = 0;
 102
 103        spin_lock_irqsave(&qib_devs_lock, flags);
 104        list_for_each_entry(dd, &qib_dev_list, list) {
 105                if (!(dd->flags & QIB_PRESENT) || !dd->kregbase)
 106                        continue;
 107                for (pidx = 0; pidx < dd->num_pports; ++pidx) {
 108                        ppd = dd->pport + pidx;
 109                        if (ppd->lid && (ppd->lflags & (QIBL_LINKINIT |
 110                                         QIBL_LINKARMED | QIBL_LINKACTIVE))) {
 111                                nunits_active++;
 112                                break;
 113                        }
 114                }
 115        }
 116        spin_unlock_irqrestore(&qib_devs_lock, flags);
 117        return nunits_active;
 118}
 119
 120/*
 121 * Return count of all units, optionally return in arguments
 122 * the number of usable (present) units, and the number of
 123 * ports that are up.
 124 */
 125int qib_count_units(int *npresentp, int *nupp)
 126{
 127        int nunits = 0, npresent = 0, nup = 0;
 128        struct qib_devdata *dd;
 129        unsigned long flags;
 130        int pidx;
 131        struct qib_pportdata *ppd;
 132
 133        spin_lock_irqsave(&qib_devs_lock, flags);
 134
 135        list_for_each_entry(dd, &qib_dev_list, list) {
 136                nunits++;
 137                if ((dd->flags & QIB_PRESENT) && dd->kregbase)
 138                        npresent++;
 139                for (pidx = 0; pidx < dd->num_pports; ++pidx) {
 140                        ppd = dd->pport + pidx;
 141                        if (ppd->lid && (ppd->lflags & (QIBL_LINKINIT |
 142                                         QIBL_LINKARMED | QIBL_LINKACTIVE)))
 143                                nup++;
 144                }
 145        }
 146
 147        spin_unlock_irqrestore(&qib_devs_lock, flags);
 148
 149        if (npresentp)
 150                *npresentp = npresent;
 151        if (nupp)
 152                *nupp = nup;
 153
 154        return nunits;
 155}
 156
 157/**
 158 * qib_wait_linkstate - wait for an IB link state change to occur
 159 * @dd: the qlogic_ib device
 160 * @state: the state to wait for
 161 * @msecs: the number of milliseconds to wait
 162 *
 163 * wait up to msecs milliseconds for IB link state change to occur for
 164 * now, take the easy polling route.  Currently used only by
 165 * qib_set_linkstate.  Returns 0 if state reached, otherwise
 166 * -ETIMEDOUT state can have multiple states set, for any of several
 167 * transitions.
 168 */
 169int qib_wait_linkstate(struct qib_pportdata *ppd, u32 state, int msecs)
 170{
 171        int ret;
 172        unsigned long flags;
 173
 174        spin_lock_irqsave(&ppd->lflags_lock, flags);
 175        if (ppd->state_wanted) {
 176                spin_unlock_irqrestore(&ppd->lflags_lock, flags);
 177                ret = -EBUSY;
 178                goto bail;
 179        }
 180        ppd->state_wanted = state;
 181        spin_unlock_irqrestore(&ppd->lflags_lock, flags);
 182        wait_event_interruptible_timeout(ppd->state_wait,
 183                                         (ppd->lflags & state),
 184                                         msecs_to_jiffies(msecs));
 185        spin_lock_irqsave(&ppd->lflags_lock, flags);
 186        ppd->state_wanted = 0;
 187        spin_unlock_irqrestore(&ppd->lflags_lock, flags);
 188
 189        if (!(ppd->lflags & state))
 190                ret = -ETIMEDOUT;
 191        else
 192                ret = 0;
 193bail:
 194        return ret;
 195}
 196
 197int qib_set_linkstate(struct qib_pportdata *ppd, u8 newstate)
 198{
 199        u32 lstate;
 200        int ret;
 201        struct qib_devdata *dd = ppd->dd;
 202        unsigned long flags;
 203
 204        switch (newstate) {
 205        case QIB_IB_LINKDOWN_ONLY:
 206                dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
 207                                 IB_LINKCMD_DOWN | IB_LINKINITCMD_NOP);
 208                /* don't wait */
 209                ret = 0;
 210                goto bail;
 211
 212        case QIB_IB_LINKDOWN:
 213                dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
 214                                 IB_LINKCMD_DOWN | IB_LINKINITCMD_POLL);
 215                /* don't wait */
 216                ret = 0;
 217                goto bail;
 218
 219        case QIB_IB_LINKDOWN_SLEEP:
 220                dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
 221                                 IB_LINKCMD_DOWN | IB_LINKINITCMD_SLEEP);
 222                /* don't wait */
 223                ret = 0;
 224                goto bail;
 225
 226        case QIB_IB_LINKDOWN_DISABLE:
 227                dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
 228                                 IB_LINKCMD_DOWN | IB_LINKINITCMD_DISABLE);
 229                /* don't wait */
 230                ret = 0;
 231                goto bail;
 232
 233        case QIB_IB_LINKARM:
 234                if (ppd->lflags & QIBL_LINKARMED) {
 235                        ret = 0;
 236                        goto bail;
 237                }
 238                if (!(ppd->lflags & (QIBL_LINKINIT | QIBL_LINKACTIVE))) {
 239                        ret = -EINVAL;
 240                        goto bail;
 241                }
 242                /*
 243                 * Since the port can be ACTIVE when we ask for ARMED,
 244                 * clear QIBL_LINKV so we can wait for a transition.
 245                 * If the link isn't ARMED, then something else happened
 246                 * and there is no point waiting for ARMED.
 247                 */
 248                spin_lock_irqsave(&ppd->lflags_lock, flags);
 249                ppd->lflags &= ~QIBL_LINKV;
 250                spin_unlock_irqrestore(&ppd->lflags_lock, flags);
 251                dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
 252                                 IB_LINKCMD_ARMED | IB_LINKINITCMD_NOP);
 253                lstate = QIBL_LINKV;
 254                break;
 255
 256        case QIB_IB_LINKACTIVE:
 257                if (ppd->lflags & QIBL_LINKACTIVE) {
 258                        ret = 0;
 259                        goto bail;
 260                }
 261                if (!(ppd->lflags & QIBL_LINKARMED)) {
 262                        ret = -EINVAL;
 263                        goto bail;
 264                }
 265                dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LSTATE,
 266                                 IB_LINKCMD_ACTIVE | IB_LINKINITCMD_NOP);
 267                lstate = QIBL_LINKACTIVE;
 268                break;
 269
 270        default:
 271                ret = -EINVAL;
 272                goto bail;
 273        }
 274        ret = qib_wait_linkstate(ppd, lstate, 10);
 275
 276bail:
 277        return ret;
 278}
 279
 280/*
 281 * Get address of eager buffer from it's index (allocated in chunks, not
 282 * contiguous).
 283 */
 284static inline void *qib_get_egrbuf(const struct qib_ctxtdata *rcd, u32 etail)
 285{
 286        const u32 chunk = etail >> rcd->rcvegrbufs_perchunk_shift;
 287        const u32 idx =  etail & ((u32)rcd->rcvegrbufs_perchunk - 1);
 288
 289        return rcd->rcvegrbuf[chunk] + (idx << rcd->dd->rcvegrbufsize_shift);
 290}
 291
 292/*
 293 * Returns 1 if error was a CRC, else 0.
 294 * Needed for some chip's synthesized error counters.
 295 */
 296static u32 qib_rcv_hdrerr(struct qib_ctxtdata *rcd, struct qib_pportdata *ppd,
 297                          u32 ctxt, u32 eflags, u32 l, u32 etail,
 298                          __le32 *rhf_addr, struct qib_message_header *rhdr)
 299{
 300        u32 ret = 0;
 301
 302        if (eflags & (QLOGIC_IB_RHF_H_ICRCERR | QLOGIC_IB_RHF_H_VCRCERR))
 303                ret = 1;
 304        else if (eflags == QLOGIC_IB_RHF_H_TIDERR) {
 305                /* For TIDERR and RC QPs premptively schedule a NAK */
 306                struct qib_ib_header *hdr = (struct qib_ib_header *) rhdr;
 307                struct qib_other_headers *ohdr = NULL;
 308                struct qib_ibport *ibp = &ppd->ibport_data;
 309                struct qib_qp *qp = NULL;
 310                u32 tlen = qib_hdrget_length_in_bytes(rhf_addr);
 311                u16 lid  = be16_to_cpu(hdr->lrh[1]);
 312                int lnh = be16_to_cpu(hdr->lrh[0]) & 3;
 313                u32 qp_num;
 314                u32 opcode;
 315                u32 psn;
 316                int diff;
 317
 318                /* Sanity check packet */
 319                if (tlen < 24)
 320                        goto drop;
 321
 322                if (lid < QIB_MULTICAST_LID_BASE) {
 323                        lid &= ~((1 << ppd->lmc) - 1);
 324                        if (unlikely(lid != ppd->lid))
 325                                goto drop;
 326                }
 327
 328                /* Check for GRH */
 329                if (lnh == QIB_LRH_BTH)
 330                        ohdr = &hdr->u.oth;
 331                else if (lnh == QIB_LRH_GRH) {
 332                        u32 vtf;
 333
 334                        ohdr = &hdr->u.l.oth;
 335                        if (hdr->u.l.grh.next_hdr != IB_GRH_NEXT_HDR)
 336                                goto drop;
 337                        vtf = be32_to_cpu(hdr->u.l.grh.version_tclass_flow);
 338                        if ((vtf >> IB_GRH_VERSION_SHIFT) != IB_GRH_VERSION)
 339                                goto drop;
 340                } else
 341                        goto drop;
 342
 343                /* Get opcode and PSN from packet */
 344                opcode = be32_to_cpu(ohdr->bth[0]);
 345                opcode >>= 24;
 346                psn = be32_to_cpu(ohdr->bth[2]);
 347
 348                /* Get the destination QP number. */
 349                qp_num = be32_to_cpu(ohdr->bth[1]) & QIB_QPN_MASK;
 350                if (qp_num != QIB_MULTICAST_QPN) {
 351                        int ruc_res;
 352
 353                        qp = qib_lookup_qpn(ibp, qp_num);
 354                        if (!qp)
 355                                goto drop;
 356
 357                        /*
 358                         * Handle only RC QPs - for other QP types drop error
 359                         * packet.
 360                         */
 361                        spin_lock(&qp->r_lock);
 362
 363                        /* Check for valid receive state. */
 364                        if (!(ib_qib_state_ops[qp->state] &
 365                              QIB_PROCESS_RECV_OK)) {
 366                                ibp->n_pkt_drops++;
 367                                goto unlock;
 368                        }
 369
 370                        switch (qp->ibqp.qp_type) {
 371                        case IB_QPT_RC:
 372                                ruc_res =
 373                                        qib_ruc_check_hdr(
 374                                                ibp, hdr,
 375                                                lnh == QIB_LRH_GRH,
 376                                                qp,
 377                                                be32_to_cpu(ohdr->bth[0]));
 378                                if (ruc_res)
 379                                        goto unlock;
 380
 381                                /* Only deal with RDMA Writes for now */
 382                                if (opcode <
 383                                    IB_OPCODE_RC_RDMA_READ_RESPONSE_FIRST) {
 384                                        diff = qib_cmp24(psn, qp->r_psn);
 385                                        if (!qp->r_nak_state && diff >= 0) {
 386                                                ibp->n_rc_seqnak++;
 387                                                qp->r_nak_state =
 388                                                        IB_NAK_PSN_ERROR;
 389                                                /* Use the expected PSN. */
 390                                                qp->r_ack_psn = qp->r_psn;
 391                                                /*
 392                                                 * Wait to send the sequence
 393                                                 * NAK until all packets
 394                                                 * in the receive queue have
 395                                                 * been processed.
 396                                                 * Otherwise, we end up
 397                                                 * propagating congestion.
 398                                                 */
 399                                                if (list_empty(&qp->rspwait)) {
 400                                                        qp->r_flags |=
 401                                                                QIB_R_RSP_NAK;
 402                                                        atomic_inc(
 403                                                                &qp->refcount);
 404                                                        list_add_tail(
 405                                                         &qp->rspwait,
 406                                                         &rcd->qp_wait_list);
 407                                                }
 408                                        } /* Out of sequence NAK */
 409                                } /* QP Request NAKs */
 410                                break;
 411                        case IB_QPT_SMI:
 412                        case IB_QPT_GSI:
 413                        case IB_QPT_UD:
 414                        case IB_QPT_UC:
 415                        default:
 416                                /* For now don't handle any other QP types */
 417                                break;
 418                        }
 419
 420unlock:
 421                        spin_unlock(&qp->r_lock);
 422                        /*
 423                         * Notify qib_destroy_qp() if it is waiting
 424                         * for us to finish.
 425                         */
 426                        if (atomic_dec_and_test(&qp->refcount))
 427                                wake_up(&qp->wait);
 428                } /* Unicast QP */
 429        } /* Valid packet with TIDErr */
 430
 431drop:
 432        return ret;
 433}
 434
 435/*
 436 * qib_kreceive - receive a packet
 437 * @rcd: the qlogic_ib context
 438 * @llic: gets count of good packets needed to clear lli,
 439 *          (used with chips that need need to track crcs for lli)
 440 *
 441 * called from interrupt handler for errors or receive interrupt
 442 * Returns number of CRC error packets, needed by some chips for
 443 * local link integrity tracking.   crcs are adjusted down by following
 444 * good packets, if any, and count of good packets is also tracked.
 445 */
 446u32 qib_kreceive(struct qib_ctxtdata *rcd, u32 *llic, u32 *npkts)
 447{
 448        struct qib_devdata *dd = rcd->dd;
 449        struct qib_pportdata *ppd = rcd->ppd;
 450        __le32 *rhf_addr;
 451        void *ebuf;
 452        const u32 rsize = dd->rcvhdrentsize;        /* words */
 453        const u32 maxcnt = dd->rcvhdrcnt * rsize;   /* words */
 454        u32 etail = -1, l, hdrqtail;
 455        struct qib_message_header *hdr;
 456        u32 eflags, etype, tlen, i = 0, updegr = 0, crcs = 0;
 457        int last;
 458        u64 lval;
 459        struct qib_qp *qp, *nqp;
 460
 461        l = rcd->head;
 462        rhf_addr = (__le32 *) rcd->rcvhdrq + l + dd->rhf_offset;
 463        if (dd->flags & QIB_NODMA_RTAIL) {
 464                u32 seq = qib_hdrget_seq(rhf_addr);
 465
 466                if (seq != rcd->seq_cnt)
 467                        goto bail;
 468                hdrqtail = 0;
 469        } else {
 470                hdrqtail = qib_get_rcvhdrtail(rcd);
 471                if (l == hdrqtail)
 472                        goto bail;
 473                smp_rmb();  /* prevent speculative reads of dma'ed hdrq */
 474        }
 475
 476        for (last = 0, i = 1; !last; i += !last) {
 477                hdr = dd->f_get_msgheader(dd, rhf_addr);
 478                eflags = qib_hdrget_err_flags(rhf_addr);
 479                etype = qib_hdrget_rcv_type(rhf_addr);
 480                /* total length */
 481                tlen = qib_hdrget_length_in_bytes(rhf_addr);
 482                ebuf = NULL;
 483                if ((dd->flags & QIB_NODMA_RTAIL) ?
 484                    qib_hdrget_use_egr_buf(rhf_addr) :
 485                    (etype != RCVHQ_RCV_TYPE_EXPECTED)) {
 486                        etail = qib_hdrget_index(rhf_addr);
 487                        updegr = 1;
 488                        if (tlen > sizeof(*hdr) ||
 489                            etype >= RCVHQ_RCV_TYPE_NON_KD) {
 490                                ebuf = qib_get_egrbuf(rcd, etail);
 491                                prefetch_range(ebuf, tlen - sizeof(*hdr));
 492                        }
 493                }
 494                if (!eflags) {
 495                        u16 lrh_len = be16_to_cpu(hdr->lrh[2]) << 2;
 496
 497                        if (lrh_len != tlen) {
 498                                qib_stats.sps_lenerrs++;
 499                                goto move_along;
 500                        }
 501                }
 502                if (etype == RCVHQ_RCV_TYPE_NON_KD && !eflags &&
 503                    ebuf == NULL &&
 504                    tlen > (dd->rcvhdrentsize - 2 + 1 -
 505                                qib_hdrget_offset(rhf_addr)) << 2) {
 506                        goto move_along;
 507                }
 508
 509                /*
 510                 * Both tiderr and qibhdrerr are set for all plain IB
 511                 * packets; only qibhdrerr should be set.
 512                 */
 513                if (unlikely(eflags))
 514                        crcs += qib_rcv_hdrerr(rcd, ppd, rcd->ctxt, eflags, l,
 515                                               etail, rhf_addr, hdr);
 516                else if (etype == RCVHQ_RCV_TYPE_NON_KD) {
 517                        qib_ib_rcv(rcd, hdr, ebuf, tlen);
 518                        if (crcs)
 519                                crcs--;
 520                        else if (llic && *llic)
 521                                --*llic;
 522                }
 523move_along:
 524                l += rsize;
 525                if (l >= maxcnt)
 526                        l = 0;
 527                if (i == QIB_MAX_PKT_RECV)
 528                        last = 1;
 529
 530                rhf_addr = (__le32 *) rcd->rcvhdrq + l + dd->rhf_offset;
 531                if (dd->flags & QIB_NODMA_RTAIL) {
 532                        u32 seq = qib_hdrget_seq(rhf_addr);
 533
 534                        if (++rcd->seq_cnt > 13)
 535                                rcd->seq_cnt = 1;
 536                        if (seq != rcd->seq_cnt)
 537                                last = 1;
 538                } else if (l == hdrqtail)
 539                        last = 1;
 540                /*
 541                 * Update head regs etc., every 16 packets, if not last pkt,
 542                 * to help prevent rcvhdrq overflows, when many packets
 543                 * are processed and queue is nearly full.
 544                 * Don't request an interrupt for intermediate updates.
 545                 */
 546                lval = l;
 547                if (!last && !(i & 0xf)) {
 548                        dd->f_update_usrhead(rcd, lval, updegr, etail, i);
 549                        updegr = 0;
 550                }
 551        }
 552        /*
 553         * Notify qib_destroy_qp() if it is waiting
 554         * for lookaside_qp to finish.
 555         */
 556        if (rcd->lookaside_qp) {
 557                if (atomic_dec_and_test(&rcd->lookaside_qp->refcount))
 558                        wake_up(&rcd->lookaside_qp->wait);
 559                rcd->lookaside_qp = NULL;
 560        }
 561
 562        rcd->head = l;
 563
 564        /*
 565         * Iterate over all QPs waiting to respond.
 566         * The list won't change since the IRQ is only run on one CPU.
 567         */
 568        list_for_each_entry_safe(qp, nqp, &rcd->qp_wait_list, rspwait) {
 569                list_del_init(&qp->rspwait);
 570                if (qp->r_flags & QIB_R_RSP_NAK) {
 571                        qp->r_flags &= ~QIB_R_RSP_NAK;
 572                        qib_send_rc_ack(qp);
 573                }
 574                if (qp->r_flags & QIB_R_RSP_SEND) {
 575                        unsigned long flags;
 576
 577                        qp->r_flags &= ~QIB_R_RSP_SEND;
 578                        spin_lock_irqsave(&qp->s_lock, flags);
 579                        if (ib_qib_state_ops[qp->state] &
 580                                        QIB_PROCESS_OR_FLUSH_SEND)
 581                                qib_schedule_send(qp);
 582                        spin_unlock_irqrestore(&qp->s_lock, flags);
 583                }
 584                if (atomic_dec_and_test(&qp->refcount))
 585                        wake_up(&qp->wait);
 586        }
 587
 588bail:
 589        /* Report number of packets consumed */
 590        if (npkts)
 591                *npkts = i;
 592
 593        /*
 594         * Always write head at end, and setup rcv interrupt, even
 595         * if no packets were processed.
 596         */
 597        lval = (u64)rcd->head | dd->rhdrhead_intr_off;
 598        dd->f_update_usrhead(rcd, lval, updegr, etail, i);
 599        return crcs;
 600}
 601
 602/**
 603 * qib_set_mtu - set the MTU
 604 * @ppd: the perport data
 605 * @arg: the new MTU
 606 *
 607 * We can handle "any" incoming size, the issue here is whether we
 608 * need to restrict our outgoing size.   For now, we don't do any
 609 * sanity checking on this, and we don't deal with what happens to
 610 * programs that are already running when the size changes.
 611 * NOTE: changing the MTU will usually cause the IBC to go back to
 612 * link INIT state...
 613 */
 614int qib_set_mtu(struct qib_pportdata *ppd, u16 arg)
 615{
 616        u32 piosize;
 617        int ret, chk;
 618
 619        if (arg != 256 && arg != 512 && arg != 1024 && arg != 2048 &&
 620            arg != 4096) {
 621                ret = -EINVAL;
 622                goto bail;
 623        }
 624        chk = ib_mtu_enum_to_int(qib_ibmtu);
 625        if (chk > 0 && arg > chk) {
 626                ret = -EINVAL;
 627                goto bail;
 628        }
 629
 630        piosize = ppd->ibmaxlen;
 631        ppd->ibmtu = arg;
 632
 633        if (arg >= (piosize - QIB_PIO_MAXIBHDR)) {
 634                /* Only if it's not the initial value (or reset to it) */
 635                if (piosize != ppd->init_ibmaxlen) {
 636                        if (arg > piosize && arg <= ppd->init_ibmaxlen)
 637                                piosize = ppd->init_ibmaxlen - 2 * sizeof(u32);
 638                        ppd->ibmaxlen = piosize;
 639                }
 640        } else if ((arg + QIB_PIO_MAXIBHDR) != ppd->ibmaxlen) {
 641                piosize = arg + QIB_PIO_MAXIBHDR - 2 * sizeof(u32);
 642                ppd->ibmaxlen = piosize;
 643        }
 644
 645        ppd->dd->f_set_ib_cfg(ppd, QIB_IB_CFG_MTU, 0);
 646
 647        ret = 0;
 648
 649bail:
 650        return ret;
 651}
 652
 653int qib_set_lid(struct qib_pportdata *ppd, u32 lid, u8 lmc)
 654{
 655        struct qib_devdata *dd = ppd->dd;
 656
 657        ppd->lid = lid;
 658        ppd->lmc = lmc;
 659
 660        dd->f_set_ib_cfg(ppd, QIB_IB_CFG_LIDLMC,
 661                         lid | (~((1U << lmc) - 1)) << 16);
 662
 663        qib_devinfo(dd->pcidev, "IB%u:%u got a lid: 0x%x\n",
 664                    dd->unit, ppd->port, lid);
 665
 666        return 0;
 667}
 668
 669/*
 670 * Following deal with the "obviously simple" task of overriding the state
 671 * of the LEDS, which normally indicate link physical and logical status.
 672 * The complications arise in dealing with different hardware mappings
 673 * and the board-dependent routine being called from interrupts.
 674 * and then there's the requirement to _flash_ them.
 675 */
 676#define LED_OVER_FREQ_SHIFT 8
 677#define LED_OVER_FREQ_MASK (0xFF<<LED_OVER_FREQ_SHIFT)
 678/* Below is "non-zero" to force override, but both actual LEDs are off */
 679#define LED_OVER_BOTH_OFF (8)
 680
 681static void qib_run_led_override(unsigned long opaque)
 682{
 683        struct qib_pportdata *ppd = (struct qib_pportdata *)opaque;
 684        struct qib_devdata *dd = ppd->dd;
 685        int timeoff;
 686        int ph_idx;
 687
 688        if (!(dd->flags & QIB_INITTED))
 689                return;
 690
 691        ph_idx = ppd->led_override_phase++ & 1;
 692        ppd->led_override = ppd->led_override_vals[ph_idx];
 693        timeoff = ppd->led_override_timeoff;
 694
 695        dd->f_setextled(ppd, 1);
 696        /*
 697         * don't re-fire the timer if user asked for it to be off; we let
 698         * it fire one more time after they turn it off to simplify
 699         */
 700        if (ppd->led_override_vals[0] || ppd->led_override_vals[1])
 701                mod_timer(&ppd->led_override_timer, jiffies + timeoff);
 702}
 703
 704void qib_set_led_override(struct qib_pportdata *ppd, unsigned int val)
 705{
 706        struct qib_devdata *dd = ppd->dd;
 707        int timeoff, freq;
 708
 709        if (!(dd->flags & QIB_INITTED))
 710                return;
 711
 712        /* First check if we are blinking. If not, use 1HZ polling */
 713        timeoff = HZ;
 714        freq = (val & LED_OVER_FREQ_MASK) >> LED_OVER_FREQ_SHIFT;
 715
 716        if (freq) {
 717                /* For blink, set each phase from one nybble of val */
 718                ppd->led_override_vals[0] = val & 0xF;
 719                ppd->led_override_vals[1] = (val >> 4) & 0xF;
 720                timeoff = (HZ << 4)/freq;
 721        } else {
 722                /* Non-blink set both phases the same. */
 723                ppd->led_override_vals[0] = val & 0xF;
 724                ppd->led_override_vals[1] = val & 0xF;
 725        }
 726        ppd->led_override_timeoff = timeoff;
 727
 728        /*
 729         * If the timer has not already been started, do so. Use a "quick"
 730         * timeout so the function will be called soon, to look at our request.
 731         */
 732        if (atomic_inc_return(&ppd->led_override_timer_active) == 1) {
 733                /* Need to start timer */
 734                init_timer(&ppd->led_override_timer);
 735                ppd->led_override_timer.function = qib_run_led_override;
 736                ppd->led_override_timer.data = (unsigned long) ppd;
 737                ppd->led_override_timer.expires = jiffies + 1;
 738                add_timer(&ppd->led_override_timer);
 739        } else {
 740                if (ppd->led_override_vals[0] || ppd->led_override_vals[1])
 741                        mod_timer(&ppd->led_override_timer, jiffies + 1);
 742                atomic_dec(&ppd->led_override_timer_active);
 743        }
 744}
 745
 746/**
 747 * qib_reset_device - reset the chip if possible
 748 * @unit: the device to reset
 749 *
 750 * Whether or not reset is successful, we attempt to re-initialize the chip
 751 * (that is, much like a driver unload/reload).  We clear the INITTED flag
 752 * so that the various entry points will fail until we reinitialize.  For
 753 * now, we only allow this if no user contexts are open that use chip resources
 754 */
 755int qib_reset_device(int unit)
 756{
 757        int ret, i;
 758        struct qib_devdata *dd = qib_lookup(unit);
 759        struct qib_pportdata *ppd;
 760        unsigned long flags;
 761        int pidx;
 762
 763        if (!dd) {
 764                ret = -ENODEV;
 765                goto bail;
 766        }
 767
 768        qib_devinfo(dd->pcidev, "Reset on unit %u requested\n", unit);
 769
 770        if (!dd->kregbase || !(dd->flags & QIB_PRESENT)) {
 771                qib_devinfo(dd->pcidev,
 772                        "Invalid unit number %u or not initialized or not present\n",
 773                        unit);
 774                ret = -ENXIO;
 775                goto bail;
 776        }
 777
 778        spin_lock_irqsave(&dd->uctxt_lock, flags);
 779        if (dd->rcd)
 780                for (i = dd->first_user_ctxt; i < dd->cfgctxts; i++) {
 781                        if (!dd->rcd[i] || !dd->rcd[i]->cnt)
 782                                continue;
 783                        spin_unlock_irqrestore(&dd->uctxt_lock, flags);
 784                        ret = -EBUSY;
 785                        goto bail;
 786                }
 787        spin_unlock_irqrestore(&dd->uctxt_lock, flags);
 788
 789        for (pidx = 0; pidx < dd->num_pports; ++pidx) {
 790                ppd = dd->pport + pidx;
 791                if (atomic_read(&ppd->led_override_timer_active)) {
 792                        /* Need to stop LED timer, _then_ shut off LEDs */
 793                        del_timer_sync(&ppd->led_override_timer);
 794                        atomic_set(&ppd->led_override_timer_active, 0);
 795                }
 796
 797                /* Shut off LEDs after we are sure timer is not running */
 798                ppd->led_override = LED_OVER_BOTH_OFF;
 799                dd->f_setextled(ppd, 0);
 800                if (dd->flags & QIB_HAS_SEND_DMA)
 801                        qib_teardown_sdma(ppd);
 802        }
 803
 804        ret = dd->f_reset(dd);
 805        if (ret == 1)
 806                ret = qib_init(dd, 1);
 807        else
 808                ret = -EAGAIN;
 809        if (ret)
 810                qib_dev_err(dd,
 811                        "Reinitialize unit %u after reset failed with %d\n",
 812                        unit, ret);
 813        else
 814                qib_devinfo(dd->pcidev,
 815                        "Reinitialized unit %u after resetting\n",
 816                        unit);
 817
 818bail:
 819        return ret;
 820}
 821