linux/drivers/scsi/ibmvscsi/ibmvscsi.c
<<
>>
Prefs
   1/* ------------------------------------------------------------
   2 * ibmvscsi.c
   3 * (C) Copyright IBM Corporation 1994, 2004
   4 * Authors: Colin DeVilbiss (devilbis@us.ibm.com)
   5 *          Santiago Leon (santil@us.ibm.com)
   6 *          Dave Boutcher (sleddog@us.ibm.com)
   7 *
   8 * This program is free software; you can redistribute it and/or modify
   9 * it under the terms of the GNU General Public License as published by
  10 * the Free Software Foundation; either version 2 of the License, or
  11 * (at your option) any later version.
  12 *
  13 * This program is distributed in the hope that it will be useful,
  14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  16 * GNU General Public License for more details.
  17 *
  18 * You should have received a copy of the GNU General Public License
  19 * along with this program; if not, write to the Free Software
  20 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307
  21 * USA
  22 *
  23 * ------------------------------------------------------------
  24 * Emulation of a SCSI host adapter for Virtual I/O devices
  25 *
  26 * This driver supports the SCSI adapter implemented by the IBM
  27 * Power5 firmware.  That SCSI adapter is not a physical adapter,
  28 * but allows Linux SCSI peripheral drivers to directly
  29 * access devices in another logical partition on the physical system.
  30 *
  31 * The virtual adapter(s) are present in the open firmware device
  32 * tree just like real adapters.
  33 *
  34 * One of the capabilities provided on these systems is the ability
  35 * to DMA between partitions.  The architecture states that for VSCSI,
  36 * the server side is allowed to DMA to and from the client.  The client
  37 * is never trusted to DMA to or from the server directly.
  38 *
  39 * Messages are sent between partitions on a "Command/Response Queue" 
  40 * (CRQ), which is just a buffer of 16 byte entries in the receiver's memory.
  41 * Senders cannot access the buffer directly, but send messages by
  42 * making a hypervisor call and passing in the 16 bytes.  The hypervisor
  43 * puts the message in the next 16 byte space in round-robin fashion,
  44 * turns on the high order bit of the message (the valid bit), and 
  45 * generates an interrupt to the receiver (if interrupts are turned on.) 
  46 * The receiver just turns off the valid bit when they have copied out
  47 * the message.
  48 *
  49 * The VSCSI client builds a SCSI Remote Protocol (SRP) Information Unit
  50 * (IU) (as defined in the T10 standard available at www.t10.org), gets 
  51 * a DMA address for the message, and sends it to the server as the
  52 * payload of a CRQ message.  The server DMAs the SRP IU and processes it,
  53 * including doing any additional data transfers.  When it is done, it
  54 * DMAs the SRP response back to the same address as the request came from,
  55 * and sends a CRQ message back to inform the client that the request has
  56 * completed.
  57 *
  58 * TODO: This is currently pretty tied to the IBM pSeries hypervisor
  59 * interfaces.  It would be really nice to abstract this above an RDMA
  60 * layer.
  61 */
  62
  63#include <linux/module.h>
  64#include <linux/moduleparam.h>
  65#include <linux/dma-mapping.h>
  66#include <linux/delay.h>
  67#include <linux/slab.h>
  68#include <linux/of.h>
  69#include <linux/pm.h>
  70#include <linux/kthread.h>
  71#include <asm/firmware.h>
  72#include <asm/vio.h>
  73#include <scsi/scsi.h>
  74#include <scsi/scsi_cmnd.h>
  75#include <scsi/scsi_host.h>
  76#include <scsi/scsi_device.h>
  77#include <scsi/scsi_transport_srp.h>
  78#include "ibmvscsi.h"
  79
  80/* Module-wide defaults.  The values below are somewhat arbitrary, but
  81 * OS/400 will use 3 busses (disks, CDs, and tapes, I think).
  82 * Note that there are 3 bits of channel value, 6 bits of id, and
  83 * 5 bits of LUN.
  84 */
  85static int max_id = 64;                 /* largest ID value for each channel (module param) */
  86static int max_channel = 3;             /* largest channel value (module param) */
  87static int init_timeout = 300;          /* initialization timeout in seconds (module param) */
  88static int login_timeout = 60;          /* NOTE(review): presumably seconds like init_timeout -- confirm */
  89static int info_timeout = 30;           /* NOTE(review): presumably seconds -- confirm */
  90static int abort_timeout = 60;          /* NOTE(review): presumably seconds -- confirm */
  91static int reset_timeout = 60;          /* NOTE(review): presumably seconds -- confirm */
  92static int max_requests = IBMVSCSI_MAX_REQUESTS_DEFAULT;        /* maximum requests for this adapter */
  93static int max_events = IBMVSCSI_MAX_REQUESTS_DEFAULT + 2;      /* two more than the default request limit */
  94static int fast_fail = 1;               /* enable fast fail (module param, default 1) */
  95static int client_reserve = 1;          /* attempt client managed reserve/release */
  96static char partition_name[97] = "UNKNOWN";     /* replaced by gather_partition_info() if the device tree has a name */
  97static unsigned int partition_number = -1;      /* all bits set until gather_partition_info() finds a number */
  98
  99static struct scsi_transport_template *ibmvscsi_transport_template;
 100
 101#define IBMVSCSI_VERSION "1.5.9"        /* reported through MODULE_VERSION below */
 102
 103MODULE_DESCRIPTION("IBM Virtual SCSI");
 104MODULE_AUTHOR("Dave Boutcher");
 105MODULE_LICENSE("GPL");
 106MODULE_VERSION(IBMVSCSI_VERSION);
 107
 108module_param_named(max_id, max_id, int, S_IRUGO | S_IWUSR);
 109MODULE_PARM_DESC(max_id, "Largest ID value for each channel");
 110module_param_named(max_channel, max_channel, int, S_IRUGO | S_IWUSR);
 111MODULE_PARM_DESC(max_channel, "Largest channel value");
 112module_param_named(init_timeout, init_timeout, int, S_IRUGO | S_IWUSR);
 113MODULE_PARM_DESC(init_timeout, "Initialization timeout in seconds");
 114module_param_named(max_requests, max_requests, int, S_IRUGO);   /* read-only: no S_IWUSR */
 115MODULE_PARM_DESC(max_requests, "Maximum requests for this adapter");
 116module_param_named(fast_fail, fast_fail, int, S_IRUGO | S_IWUSR);
 117MODULE_PARM_DESC(fast_fail, "Enable fast fail. [Default=1]");
 118module_param_named(client_reserve, client_reserve, int, S_IRUGO );      /* read-only: no S_IWUSR */
 119MODULE_PARM_DESC(client_reserve, "Attempt client managed reserve/release");
 120
 121static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
 122                                struct ibmvscsi_host_data *hostdata);   /* forward declaration: ibmvscsi_task() calls it */
 123
 124/* ------------------------------------------------------------
 125 * Routines for managing the command/response queue
 126 */
 127/**
 128 * ibmvscsi_handle_event: - Interrupt handler for crq events
 129 * @irq:        number of irq to handle, not used
 130 * @dev_instance: ibmvscsi_host_data of host that received interrupt
 131 *
 132 * Disables interrupts and schedules srp_task
 133 * Always returns IRQ_HANDLED
 134 */
 135static irqreturn_t ibmvscsi_handle_event(int irq, void *dev_instance)
 136{
 137        struct ibmvscsi_host_data *hostdata =
 138            (struct ibmvscsi_host_data *)dev_instance;
 139        vio_disable_interrupts(to_vio_dev(hostdata->dev));
 140        tasklet_schedule(&hostdata->srp_task);
 141        return IRQ_HANDLED;
 142}
 143
 144/**
 145 * release_crq_queue: - Deallocates data and unregisters CRQ
 146 * @queue:      crq_queue to initialize and register
 147 * @host_data:  ibmvscsi_host_data of host
 148 *
 149 * Frees irq, deallocates a page for messages, unmaps dma, and unregisters
 150 * the crq with the hypervisor.
 151 */
 152static void ibmvscsi_release_crq_queue(struct crq_queue *queue,
 153                                       struct ibmvscsi_host_data *hostdata,
 154                                       int max_requests)
 155{
 156        long rc = 0;
 157        struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 158        free_irq(vdev->irq, (void *)hostdata);
 159        tasklet_kill(&hostdata->srp_task);
 160        do {
 161                if (rc)
 162                        msleep(100);
 163                rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 164        } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 165        dma_unmap_single(hostdata->dev,
 166                         queue->msg_token,
 167                         queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
 168        free_page((unsigned long)queue->msgs);
 169}
 170
 171/**
 172 * crq_queue_next_crq: - Returns the next entry in message queue
 173 * @queue:      crq_queue to use
 174 *
 175 * Returns pointer to next entry in queue, or NULL if there are no new
 176 * entried in the CRQ.
 177 */
 178static struct viosrp_crq *crq_queue_next_crq(struct crq_queue *queue)
 179{
 180        struct viosrp_crq *crq;
 181        unsigned long flags;
 182
 183        spin_lock_irqsave(&queue->lock, flags);
 184        crq = &queue->msgs[queue->cur];
 185        if (crq->valid & 0x80) {
 186                if (++queue->cur == queue->size)
 187                        queue->cur = 0;
 188        } else
 189                crq = NULL;
 190        spin_unlock_irqrestore(&queue->lock, flags);
 191
 192        return crq;
 193}
 194
 195/**
 196 * ibmvscsi_send_crq: - Send a CRQ
 197 * @hostdata:   the adapter
 198 * @word1:      the first 64 bits of the data
 199 * @word2:      the second 64 bits of the data
 200 */
 201static int ibmvscsi_send_crq(struct ibmvscsi_host_data *hostdata,
 202                             u64 word1, u64 word2)
 203{
 204        struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 205
 206        return plpar_hcall_norets(H_SEND_CRQ, vdev->unit_address, word1, word2);
 207}
 208
 209/**
 210 * ibmvscsi_task: - Process srps asynchronously
 211 * @data:       ibmvscsi_host_data of host
 212 */
 213static void ibmvscsi_task(void *data)
 214{
 215        struct ibmvscsi_host_data *hostdata = (struct ibmvscsi_host_data *)data;
 216        struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 217        struct viosrp_crq *crq;
 218        int done = 0;
 219
 220        while (!done) {
 221                /* Pull all the valid messages off the CRQ */
 222                while ((crq = crq_queue_next_crq(&hostdata->queue)) != NULL) {
 223                        ibmvscsi_handle_crq(crq, hostdata);
 224                        crq->valid = 0x00;
 225                }
 226
 227                vio_enable_interrupts(vdev);
 228                crq = crq_queue_next_crq(&hostdata->queue);
 229                if (crq != NULL) {
 230                        vio_disable_interrupts(vdev);
 231                        ibmvscsi_handle_crq(crq, hostdata);
 232                        crq->valid = 0x00;
 233                } else {
 234                        done = 1;
 235                }
 236        }
 237}
 238
 239static void gather_partition_info(void)
 240{
 241        struct device_node *rootdn;
 242
 243        const char *ppartition_name;
 244        const unsigned int *p_number_ptr;
 245
 246        /* Retrieve information about this partition */
 247        rootdn = of_find_node_by_path("/");
 248        if (!rootdn) {
 249                return;
 250        }
 251
 252        ppartition_name = of_get_property(rootdn, "ibm,partition-name", NULL);
 253        if (ppartition_name)
 254                strncpy(partition_name, ppartition_name,
 255                                sizeof(partition_name));
 256        p_number_ptr = of_get_property(rootdn, "ibm,partition-no", NULL);
 257        if (p_number_ptr)
 258                partition_number = *p_number_ptr;
 259        of_node_put(rootdn);
 260}
 261
 262static void set_adapter_info(struct ibmvscsi_host_data *hostdata)
 263{
 264        memset(&hostdata->madapter_info, 0x00,
 265                        sizeof(hostdata->madapter_info));
 266
 267        dev_info(hostdata->dev, "SRP_VERSION: %s\n", SRP_VERSION);
 268        strcpy(hostdata->madapter_info.srp_version, SRP_VERSION);
 269
 270        strncpy(hostdata->madapter_info.partition_name, partition_name,
 271                        sizeof(hostdata->madapter_info.partition_name));
 272
 273        hostdata->madapter_info.partition_number = partition_number;
 274
 275        hostdata->madapter_info.mad_version = 1;
 276        hostdata->madapter_info.os_type = 2;
 277}
 278
 279/**
 280 * reset_crq_queue: - resets a crq after a failure
 281 * @queue:      crq_queue to initialize and register
 282 * @hostdata:   ibmvscsi_host_data of host
 283 *
 284 */
 285static int ibmvscsi_reset_crq_queue(struct crq_queue *queue,
 286                                    struct ibmvscsi_host_data *hostdata)
 287{
 288        int rc = 0;
 289        struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 290
 291        /* Close the CRQ */
 292        do {
 293                if (rc)
 294                        msleep(100);
 295                rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 296        } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 297
 298        /* Clean out the queue */
 299        memset(queue->msgs, 0x00, PAGE_SIZE);
 300        queue->cur = 0;
 301
 302        set_adapter_info(hostdata);
 303
 304        /* And re-open it again */
 305        rc = plpar_hcall_norets(H_REG_CRQ,
 306                                vdev->unit_address,
 307                                queue->msg_token, PAGE_SIZE);
 308        if (rc == 2) {
 309                /* Adapter is good, but other end is not ready */
 310                dev_warn(hostdata->dev, "Partner adapter not ready\n");
 311        } else if (rc != 0) {
 312                dev_warn(hostdata->dev, "couldn't register crq--rc 0x%x\n", rc);
 313        }
 314        return rc;
 315}
 316
 317/**
 318 * initialize_crq_queue: - Initializes and registers CRQ with hypervisor
 319 * @queue:      crq_queue to initialize and register
 320 * @hostdata:   ibmvscsi_host_data of host
 321 *
 322 * Allocates a page for messages, maps it for dma, and registers
 323 * the crq with the hypervisor.
 324 * Returns zero on success.
 325 */
 326static int ibmvscsi_init_crq_queue(struct crq_queue *queue,
 327                                   struct ibmvscsi_host_data *hostdata,
 328                                   int max_requests)
 329{
 330        int rc;
 331        int retrc;
 332        struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 333
 334        queue->msgs = (struct viosrp_crq *)get_zeroed_page(GFP_KERNEL);
 335
 336        if (!queue->msgs)
 337                goto malloc_failed;
 338        queue->size = PAGE_SIZE / sizeof(*queue->msgs);
 339
 340        queue->msg_token = dma_map_single(hostdata->dev, queue->msgs,
 341                                          queue->size * sizeof(*queue->msgs),
 342                                          DMA_BIDIRECTIONAL);
 343
 344        if (dma_mapping_error(hostdata->dev, queue->msg_token))
 345                goto map_failed;
 346
 347        gather_partition_info();
 348        set_adapter_info(hostdata);
 349
 350        retrc = rc = plpar_hcall_norets(H_REG_CRQ,
 351                                vdev->unit_address,
 352                                queue->msg_token, PAGE_SIZE);
 353        if (rc == H_RESOURCE)
 354                /* maybe kexecing and resource is busy. try a reset */
 355                rc = ibmvscsi_reset_crq_queue(queue,
 356                                              hostdata);
 357
 358        if (rc == 2) {
 359                /* Adapter is good, but other end is not ready */
 360                dev_warn(hostdata->dev, "Partner adapter not ready\n");
 361                retrc = 0;
 362        } else if (rc != 0) {
 363                dev_warn(hostdata->dev, "Error %d opening adapter\n", rc);
 364                goto reg_crq_failed;
 365        }
 366
 367        queue->cur = 0;
 368        spin_lock_init(&queue->lock);
 369
 370        tasklet_init(&hostdata->srp_task, (void *)ibmvscsi_task,
 371                     (unsigned long)hostdata);
 372
 373        if (request_irq(vdev->irq,
 374                        ibmvscsi_handle_event,
 375                        0, "ibmvscsi", (void *)hostdata) != 0) {
 376                dev_err(hostdata->dev, "couldn't register irq 0x%x\n",
 377                        vdev->irq);
 378                goto req_irq_failed;
 379        }
 380
 381        rc = vio_enable_interrupts(vdev);
 382        if (rc != 0) {
 383                dev_err(hostdata->dev, "Error %d enabling interrupts!!!\n", rc);
 384                goto req_irq_failed;
 385        }
 386
 387        return retrc;
 388
 389      req_irq_failed:
 390        tasklet_kill(&hostdata->srp_task);
 391        rc = 0;
 392        do {
 393                if (rc)
 394                        msleep(100);
 395                rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 396        } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 397      reg_crq_failed:
 398        dma_unmap_single(hostdata->dev,
 399                         queue->msg_token,
 400                         queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
 401      map_failed:
 402        free_page((unsigned long)queue->msgs);
 403      malloc_failed:
 404        return -1;
 405}
 406
 407/**
 408 * reenable_crq_queue: - reenables a crq after
 409 * @queue:      crq_queue to initialize and register
 410 * @hostdata:   ibmvscsi_host_data of host
 411 *
 412 */
 413static int ibmvscsi_reenable_crq_queue(struct crq_queue *queue,
 414                                       struct ibmvscsi_host_data *hostdata)
 415{
 416        int rc = 0;
 417        struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 418
 419        /* Re-enable the CRQ */
 420        do {
 421                if (rc)
 422                        msleep(100);
 423                rc = plpar_hcall_norets(H_ENABLE_CRQ, vdev->unit_address);
 424        } while ((rc == H_IN_PROGRESS) || (rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 425
 426        if (rc)
 427                dev_err(hostdata->dev, "Error %d enabling adapter\n", rc);
 428        return rc;
 429}
 430
 431/* ------------------------------------------------------------
 432 * Routines for the event pool and event structs
 433 */
 434/**
 435 * initialize_event_pool: - Allocates and initializes the event pool for a host
 436 * @pool:       event_pool to be initialized
 437 * @size:       Number of events in pool
 438 * @hostdata:   ibmvscsi_host_data who owns the event pool
 439 *
 440 * Returns zero on success.
 441*/
 442static int initialize_event_pool(struct event_pool *pool,
 443                                 int size, struct ibmvscsi_host_data *hostdata)
 444{
 445        int i;
 446
 447        pool->size = size;
 448        pool->next = 0;
 449        pool->events = kcalloc(pool->size, sizeof(*pool->events), GFP_KERNEL);
 450        if (!pool->events)
 451                return -ENOMEM;
 452
 453        pool->iu_storage =
 454            dma_alloc_coherent(hostdata->dev,
 455                               pool->size * sizeof(*pool->iu_storage),
 456                               &pool->iu_token, 0);
 457        if (!pool->iu_storage) {
 458                kfree(pool->events);
 459                return -ENOMEM;
 460        }
 461
 462        for (i = 0; i < pool->size; ++i) {
 463                struct srp_event_struct *evt = &pool->events[i];
 464                memset(&evt->crq, 0x00, sizeof(evt->crq));
 465                atomic_set(&evt->free, 1);
 466                evt->crq.valid = 0x80;
 467                evt->crq.IU_length = sizeof(*evt->xfer_iu);
 468                evt->crq.IU_data_ptr = pool->iu_token + 
 469                        sizeof(*evt->xfer_iu) * i;
 470                evt->xfer_iu = pool->iu_storage + i;
 471                evt->hostdata = hostdata;
 472                evt->ext_list = NULL;
 473                evt->ext_list_token = 0;
 474        }
 475
 476        return 0;
 477}
 478
 479/**
 480 * release_event_pool: - Frees memory of an event pool of a host
 481 * @pool:       event_pool to be released
 482 * @hostdata:   ibmvscsi_host_data who owns the even pool
 483 *
 484 * Returns zero on success.
 485*/
 486static void release_event_pool(struct event_pool *pool,
 487                               struct ibmvscsi_host_data *hostdata)
 488{
 489        int i, in_use = 0;
 490        for (i = 0; i < pool->size; ++i) {
 491                if (atomic_read(&pool->events[i].free) != 1)
 492                        ++in_use;
 493                if (pool->events[i].ext_list) {
 494                        dma_free_coherent(hostdata->dev,
 495                                  SG_ALL * sizeof(struct srp_direct_buf),
 496                                  pool->events[i].ext_list,
 497                                  pool->events[i].ext_list_token);
 498                }
 499        }
 500        if (in_use)
 501                dev_warn(hostdata->dev, "releasing event pool with %d "
 502                         "events still in use?\n", in_use);
 503        kfree(pool->events);
 504        dma_free_coherent(hostdata->dev,
 505                          pool->size * sizeof(*pool->iu_storage),
 506                          pool->iu_storage, pool->iu_token);
 507}
 508
 509/**
 510 * valid_event_struct: - Determines if event is valid.
 511 * @pool:       event_pool that contains the event
 512 * @evt:        srp_event_struct to be checked for validity
 513 *
 514 * Returns zero if event is invalid, one otherwise.
 515*/
 516static int valid_event_struct(struct event_pool *pool,
 517                                struct srp_event_struct *evt)
 518{
 519        int index = evt - pool->events;
 520        if (index < 0 || index >= pool->size)   /* outside of bounds */
 521                return 0;
 522        if (evt != pool->events + index)        /* unaligned */
 523                return 0;
 524        return 1;
 525}
 526
 527/**
 528 * ibmvscsi_free-event_struct: - Changes status of event to "free"
 529 * @pool:       event_pool that contains the event
 530 * @evt:        srp_event_struct to be modified
 531 *
 532*/
 533static void free_event_struct(struct event_pool *pool,
 534                                       struct srp_event_struct *evt)
 535{
 536        if (!valid_event_struct(pool, evt)) {
 537                dev_err(evt->hostdata->dev, "Freeing invalid event_struct %p "
 538                        "(not in pool %p)\n", evt, pool->events);
 539                return;
 540        }
 541        if (atomic_inc_return(&evt->free) != 1) {
 542                dev_err(evt->hostdata->dev, "Freeing event_struct %p "
 543                        "which is not in use!\n", evt);
 544                return;
 545        }
 546}
 547
 548/**
 549 * get_evt_struct: - Gets the next free event in pool
 550 * @pool:       event_pool that contains the events to be searched
 551 *
 552 * Returns the next event in "free" state, and NULL if none are free.
 553 * Note that no synchronization is done here, we assume the host_lock
 554 * will syncrhonze things.
 555*/
 556static struct srp_event_struct *get_event_struct(struct event_pool *pool)
 557{
 558        int i;
 559        int poolsize = pool->size;
 560        int offset = pool->next;
 561
 562        for (i = 0; i < poolsize; i++) {
 563                offset = (offset + 1) % poolsize;
 564                if (!atomic_dec_if_positive(&pool->events[offset].free)) {
 565                        pool->next = offset;
 566                        return &pool->events[offset];
 567                }
 568        }
 569
 570        printk(KERN_ERR "ibmvscsi: found no event struct in pool!\n");
 571        return NULL;
 572}
 573
 574/**
 575 * init_event_struct: Initialize fields in an event struct that are always 
 576 *                    required.
 577 * @evt:        The event
 578 * @done:       Routine to call when the event is responded to
 579 * @format:     SRP or MAD format
 580 * @timeout:    timeout value set in the CRQ
 581 */
 582static void init_event_struct(struct srp_event_struct *evt_struct,
 583                              void (*done) (struct srp_event_struct *),
 584                              u8 format,
 585                              int timeout)
 586{
 587        evt_struct->cmnd = NULL;
 588        evt_struct->cmnd_done = NULL;
 589        evt_struct->sync_srp = NULL;
 590        evt_struct->crq.format = format;
 591        evt_struct->crq.timeout = timeout;
 592        evt_struct->done = done;
 593}
 594
 595/* ------------------------------------------------------------
 596 * Routines for receiving SCSI responses from the hosting partition
 597 */
 598
 599/**
 600 * set_srp_direction: Set the fields in the srp related to data
 601 *     direction and number of buffers based on the direction in
 602 *     the scsi_cmnd and the number of buffers
 603 */
 604static void set_srp_direction(struct scsi_cmnd *cmd,
 605                              struct srp_cmd *srp_cmd, 
 606                              int numbuf)
 607{
 608        u8 fmt;
 609
 610        if (numbuf == 0)
 611                return;
 612        
 613        if (numbuf == 1)
 614                fmt = SRP_DATA_DESC_DIRECT;
 615        else {
 616                fmt = SRP_DATA_DESC_INDIRECT;
 617                numbuf = min(numbuf, MAX_INDIRECT_BUFS);
 618
 619                if (cmd->sc_data_direction == DMA_TO_DEVICE)
 620                        srp_cmd->data_out_desc_cnt = numbuf;
 621                else
 622                        srp_cmd->data_in_desc_cnt = numbuf;
 623        }
 624
 625        if (cmd->sc_data_direction == DMA_TO_DEVICE)
 626                srp_cmd->buf_fmt = fmt << 4;
 627        else
 628                srp_cmd->buf_fmt = fmt;
 629}
 630
 631/**
 632 * unmap_cmd_data: - Unmap data pointed in srp_cmd based on the format
 633 * @cmd:        srp_cmd whose additional_data member will be unmapped
 634 * @dev:        device for which the memory is mapped
 635 *
 636*/
 637static void unmap_cmd_data(struct srp_cmd *cmd,
 638                           struct srp_event_struct *evt_struct,
 639                           struct device *dev)
 640{
 641        u8 out_fmt, in_fmt;
 642
 643        out_fmt = cmd->buf_fmt >> 4;
 644        in_fmt = cmd->buf_fmt & ((1U << 4) - 1);
 645
 646        if (out_fmt == SRP_NO_DATA_DESC && in_fmt == SRP_NO_DATA_DESC)
 647                return;
 648
 649        if (evt_struct->cmnd)
 650                scsi_dma_unmap(evt_struct->cmnd);
 651}
 652
 653static int map_sg_list(struct scsi_cmnd *cmd, int nseg,
 654                       struct srp_direct_buf *md)
 655{
 656        int i;
 657        struct scatterlist *sg;
 658        u64 total_length = 0;
 659
 660        scsi_for_each_sg(cmd, sg, nseg, i) {
 661                struct srp_direct_buf *descr = md + i;
 662                descr->va = sg_dma_address(sg);
 663                descr->len = sg_dma_len(sg);
 664                descr->key = 0;
 665                total_length += sg_dma_len(sg);
 666        }
 667        return total_length;
 668}
 669
 670/**
 671 * map_sg_data: - Maps dma for a scatterlist and initializes decriptor fields
 672 * @cmd:        Scsi_Cmnd with the scatterlist
 673 * @srp_cmd:    srp_cmd that contains the memory descriptor
 674 * @dev:        device for which to map dma memory
 675 *
 676 * Called by map_data_for_srp_cmd() when building srp cmd from scsi cmd.
 677 * Returns 1 on success.
 678*/
 679static int map_sg_data(struct scsi_cmnd *cmd,
 680                       struct srp_event_struct *evt_struct,
 681                       struct srp_cmd *srp_cmd, struct device *dev)
 682{
 683
 684        int sg_mapped;
 685        u64 total_length = 0;
 686        struct srp_direct_buf *data =
 687                (struct srp_direct_buf *) srp_cmd->add_data;
 688        struct srp_indirect_buf *indirect =
 689                (struct srp_indirect_buf *) data;
 690
 691        sg_mapped = scsi_dma_map(cmd);
 692        if (!sg_mapped)
 693                return 1;
 694        else if (sg_mapped < 0)
 695                return 0;
 696
 697        set_srp_direction(cmd, srp_cmd, sg_mapped);
 698
 699        /* special case; we can use a single direct descriptor */
 700        if (sg_mapped == 1) {
 701                map_sg_list(cmd, sg_mapped, data);
 702                return 1;
 703        }
 704
 705        indirect->table_desc.va = 0;
 706        indirect->table_desc.len = sg_mapped * sizeof(struct srp_direct_buf);
 707        indirect->table_desc.key = 0;
 708
 709        if (sg_mapped <= MAX_INDIRECT_BUFS) {
 710                total_length = map_sg_list(cmd, sg_mapped,
 711                                           &indirect->desc_list[0]);
 712                indirect->len = total_length;
 713                return 1;
 714        }
 715
 716        /* get indirect table */
 717        if (!evt_struct->ext_list) {
 718                evt_struct->ext_list = (struct srp_direct_buf *)
 719                        dma_alloc_coherent(dev,
 720                                           SG_ALL * sizeof(struct srp_direct_buf),
 721                                           &evt_struct->ext_list_token, 0);
 722                if (!evt_struct->ext_list) {
 723                        if (!firmware_has_feature(FW_FEATURE_CMO))
 724                                sdev_printk(KERN_ERR, cmd->device,
 725                                            "Can't allocate memory "
 726                                            "for indirect table\n");
 727                        scsi_dma_unmap(cmd);
 728                        return 0;
 729                }
 730        }
 731
 732        total_length = map_sg_list(cmd, sg_mapped, evt_struct->ext_list);
 733
 734        indirect->len = total_length;
 735        indirect->table_desc.va = evt_struct->ext_list_token;
 736        indirect->table_desc.len = sg_mapped * sizeof(indirect->desc_list[0]);
 737        memcpy(indirect->desc_list, evt_struct->ext_list,
 738               MAX_INDIRECT_BUFS * sizeof(struct srp_direct_buf));
 739        return 1;
 740}
 741
 742/**
 743 * map_data_for_srp_cmd: - Calls functions to map data for srp cmds
 744 * @cmd:        struct scsi_cmnd with the memory to be mapped
 745 * @srp_cmd:    srp_cmd that contains the memory descriptor
 746 * @dev:        dma device for which to map dma memory
 747 *
 748 * Called by scsi_cmd_to_srp_cmd() when converting scsi cmds to srp cmds 
 749 * Returns 1 on success.
 750*/
 751static int map_data_for_srp_cmd(struct scsi_cmnd *cmd,
 752                                struct srp_event_struct *evt_struct,
 753                                struct srp_cmd *srp_cmd, struct device *dev)
 754{
 755        switch (cmd->sc_data_direction) {
 756        case DMA_FROM_DEVICE:
 757        case DMA_TO_DEVICE:
 758                break;
 759        case DMA_NONE:
 760                return 1;
 761        case DMA_BIDIRECTIONAL:
 762                sdev_printk(KERN_ERR, cmd->device,
 763                            "Can't map DMA_BIDIRECTIONAL to read/write\n");
 764                return 0;
 765        default:
 766                sdev_printk(KERN_ERR, cmd->device,
 767                            "Unknown data direction 0x%02x; can't map!\n",
 768                            cmd->sc_data_direction);
 769                return 0;
 770        }
 771
 772        return map_sg_data(cmd, evt_struct, srp_cmd, dev);
 773}
 774
 775/**
 776 * purge_requests: Our virtual adapter just shut down.  purge any sent requests
 777 * @hostdata:    the adapter
 778 */
 779static void purge_requests(struct ibmvscsi_host_data *hostdata, int error_code)
 780{
 781        struct srp_event_struct *evt;
 782        unsigned long flags;
 783
 784        spin_lock_irqsave(hostdata->host->host_lock, flags);
 785        while (!list_empty(&hostdata->sent)) {
 786                evt = list_first_entry(&hostdata->sent, struct srp_event_struct, list);
 787                list_del(&evt->list);
 788                del_timer(&evt->timer);
 789
 790                spin_unlock_irqrestore(hostdata->host->host_lock, flags);
 791                if (evt->cmnd) {
 792                        evt->cmnd->result = (error_code << 16);
 793                        unmap_cmd_data(&evt->iu.srp.cmd, evt,
 794                                       evt->hostdata->dev);
 795                        if (evt->cmnd_done)
 796                                evt->cmnd_done(evt->cmnd);
 797                } else if (evt->done)
 798                        evt->done(evt);
 799                free_event_struct(&evt->hostdata->pool, evt);
 800                spin_lock_irqsave(hostdata->host->host_lock, flags);
 801        }
 802        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
 803}
 804
 805/**
 806 * ibmvscsi_reset_host - Reset the connection to the server
 807 * @hostdata:   struct ibmvscsi_host_data to reset
 808*/
 809static void ibmvscsi_reset_host(struct ibmvscsi_host_data *hostdata)
 810{
 811        scsi_block_requests(hostdata->host);
 812        atomic_set(&hostdata->request_limit, 0);
 813
 814        purge_requests(hostdata, DID_ERROR);
 815        hostdata->reset_crq = 1;
 816        wake_up(&hostdata->work_wait_q);
 817}
 818
 819/**
 820 * ibmvscsi_timeout - Internal command timeout handler
 821 * @evt_struct: struct srp_event_struct that timed out
 822 *
 823 * Called when an internally generated command times out
 824*/
 825static void ibmvscsi_timeout(struct srp_event_struct *evt_struct)
 826{
 827        struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
 828
 829        dev_err(hostdata->dev, "Command timed out (%x). Resetting connection\n",
 830                evt_struct->iu.srp.cmd.opcode);
 831
 832        ibmvscsi_reset_host(hostdata);
 833}
 834
 835
 836/* ------------------------------------------------------------
 837 * Routines for sending and receiving SRPs
 838 */
 839/**
 840 * ibmvscsi_send_srp_event: - Transforms event to u64 array and calls send_crq()
 841 * @evt_struct: evt_struct to be sent
 842 * @hostdata:   ibmvscsi_host_data of host
 843 * @timeout:    timeout in seconds - 0 means do not time command
 844 *
 845 * Returns the value returned from ibmvscsi_send_crq(). (Zero for success)
 846 * Note that this routine assumes that host_lock is held for synchronization
 847*/
 848static int ibmvscsi_send_srp_event(struct srp_event_struct *evt_struct,
 849                                   struct ibmvscsi_host_data *hostdata,
 850                                   unsigned long timeout)
 851{
 852        u64 *crq_as_u64 = (u64 *) &evt_struct->crq;
 853        int request_status = 0;
 854        int rc;
 855        int srp_req = 0;
 856
 857        /* If we have exhausted our request limit, just fail this request,
 858         * unless it is for a reset or abort.
 859         * Note that there are rare cases involving driver generated requests 
 860         * (such as task management requests) that the mid layer may think we
 861         * can handle more requests (can_queue) when we actually can't
 862         */
 863        if (evt_struct->crq.format == VIOSRP_SRP_FORMAT) {
 864                srp_req = 1;
 865                request_status =
 866                        atomic_dec_if_positive(&hostdata->request_limit);
 867                /* If request limit was -1 when we started, it is now even
 868                 * less than that
 869                 */
 870                if (request_status < -1)
 871                        goto send_error;
 872                /* Otherwise, we may have run out of requests. */
 873                /* If request limit was 0 when we started the adapter is in the
 874                 * process of performing a login with the server adapter, or
 875                 * we may have run out of requests.
 876                 */
 877                else if (request_status == -1 &&
 878                         evt_struct->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
 879                        goto send_busy;
 880                /* Abort and reset calls should make it through.
 881                 * Nothing except abort and reset should use the last two
 882                 * slots unless we had two or less to begin with.
 883                 */
 884                else if (request_status < 2 &&
 885                         evt_struct->iu.srp.cmd.opcode != SRP_TSK_MGMT) {
 886                        /* In the case that we have less than two requests
 887                         * available, check the server limit as a combination
 888                         * of the request limit and the number of requests
 889                         * in-flight (the size of the send list).  If the
 890                         * server limit is greater than 2, return busy so
 891                         * that the last two are reserved for reset and abort.
 892                         */
 893                        int server_limit = request_status;
 894                        struct srp_event_struct *tmp_evt;
 895
 896                        list_for_each_entry(tmp_evt, &hostdata->sent, list) {
 897                                server_limit++;
 898                        }
 899
 900                        if (server_limit > 2)
 901                                goto send_busy;
 902                }
 903        }
 904
 905        /* Copy the IU into the transfer area */
 906        *evt_struct->xfer_iu = evt_struct->iu;
 907        evt_struct->xfer_iu->srp.rsp.tag = (u64)evt_struct;
 908
 909        /* Add this to the sent list.  We need to do this 
 910         * before we actually send 
 911         * in case it comes back REALLY fast
 912         */
 913        list_add_tail(&evt_struct->list, &hostdata->sent);
 914
 915        init_timer(&evt_struct->timer);
 916        if (timeout) {
 917                evt_struct->timer.data = (unsigned long) evt_struct;
 918                evt_struct->timer.expires = jiffies + (timeout * HZ);
 919                evt_struct->timer.function = (void (*)(unsigned long))ibmvscsi_timeout;
 920                add_timer(&evt_struct->timer);
 921        }
 922
 923        if ((rc =
 924             ibmvscsi_send_crq(hostdata, crq_as_u64[0], crq_as_u64[1])) != 0) {
 925                list_del(&evt_struct->list);
 926                del_timer(&evt_struct->timer);
 927
 928                /* If send_crq returns H_CLOSED, return SCSI_MLQUEUE_HOST_BUSY.
 929                 * Firmware will send a CRQ with a transport event (0xFF) to
 930                 * tell this client what has happened to the transport.  This
 931                 * will be handled in ibmvscsi_handle_crq()
 932                 */
 933                if (rc == H_CLOSED) {
 934                        dev_warn(hostdata->dev, "send warning. "
 935                                 "Receive queue closed, will retry.\n");
 936                        goto send_busy;
 937                }
 938                dev_err(hostdata->dev, "send error %d\n", rc);
 939                if (srp_req)
 940                        atomic_inc(&hostdata->request_limit);
 941                goto send_error;
 942        }
 943
 944        return 0;
 945
 946 send_busy:
 947        unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
 948
 949        free_event_struct(&hostdata->pool, evt_struct);
 950        if (srp_req && request_status != -1)
 951                atomic_inc(&hostdata->request_limit);
 952        return SCSI_MLQUEUE_HOST_BUSY;
 953
 954 send_error:
 955        unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
 956
 957        if (evt_struct->cmnd != NULL) {
 958                evt_struct->cmnd->result = DID_ERROR << 16;
 959                evt_struct->cmnd_done(evt_struct->cmnd);
 960        } else if (evt_struct->done)
 961                evt_struct->done(evt_struct);
 962
 963        free_event_struct(&hostdata->pool, evt_struct);
 964        return 0;
 965}
 966
 967/**
 968 * handle_cmd_rsp: -  Handle responses from commands
 969 * @evt_struct: srp_event_struct to be handled
 970 *
 971 * Used as a callback by when sending scsi cmds.
 972 * Gets called by ibmvscsi_handle_crq()
 973*/
 974static void handle_cmd_rsp(struct srp_event_struct *evt_struct)
 975{
 976        struct srp_rsp *rsp = &evt_struct->xfer_iu->srp.rsp;
 977        struct scsi_cmnd *cmnd = evt_struct->cmnd;
 978
 979        if (unlikely(rsp->opcode != SRP_RSP)) {
 980                if (printk_ratelimit())
 981                        dev_warn(evt_struct->hostdata->dev,
 982                                 "bad SRP RSP type %d\n", rsp->opcode);
 983        }
 984        
 985        if (cmnd) {
 986                cmnd->result |= rsp->status;
 987                if (((cmnd->result >> 1) & 0x1f) == CHECK_CONDITION)
 988                        memcpy(cmnd->sense_buffer,
 989                               rsp->data,
 990                               rsp->sense_data_len);
 991                unmap_cmd_data(&evt_struct->iu.srp.cmd, 
 992                               evt_struct, 
 993                               evt_struct->hostdata->dev);
 994
 995                if (rsp->flags & SRP_RSP_FLAG_DOOVER)
 996                        scsi_set_resid(cmnd, rsp->data_out_res_cnt);
 997                else if (rsp->flags & SRP_RSP_FLAG_DIOVER)
 998                        scsi_set_resid(cmnd, rsp->data_in_res_cnt);
 999        }
1000
1001        if (evt_struct->cmnd_done)
1002                evt_struct->cmnd_done(cmnd);
1003}
1004
1005/**
1006 * lun_from_dev: - Returns the lun of the scsi device
1007 * @dev:        struct scsi_device
1008 *
1009*/
1010static inline u16 lun_from_dev(struct scsi_device *dev)
1011{
1012        return (0x2 << 14) | (dev->id << 8) | (dev->channel << 5) | dev->lun;
1013}
1014
1015/**
1016 * ibmvscsi_queue: - The queuecommand function of the scsi template 
1017 * @cmd:        struct scsi_cmnd to be executed
1018 * @done:       Callback function to be called when cmd is completed
1019*/
1020static int ibmvscsi_queuecommand_lck(struct scsi_cmnd *cmnd,
1021                                 void (*done) (struct scsi_cmnd *))
1022{
1023        struct srp_cmd *srp_cmd;
1024        struct srp_event_struct *evt_struct;
1025        struct srp_indirect_buf *indirect;
1026        struct ibmvscsi_host_data *hostdata = shost_priv(cmnd->device->host);
1027        u16 lun = lun_from_dev(cmnd->device);
1028        u8 out_fmt, in_fmt;
1029
1030        cmnd->result = (DID_OK << 16);
1031        evt_struct = get_event_struct(&hostdata->pool);
1032        if (!evt_struct)
1033                return SCSI_MLQUEUE_HOST_BUSY;
1034
1035        /* Set up the actual SRP IU */
1036        srp_cmd = &evt_struct->iu.srp.cmd;
1037        memset(srp_cmd, 0x00, SRP_MAX_IU_LEN);
1038        srp_cmd->opcode = SRP_CMD;
1039        memcpy(srp_cmd->cdb, cmnd->cmnd, sizeof(srp_cmd->cdb));
1040        srp_cmd->lun = ((u64) lun) << 48;
1041
1042        if (!map_data_for_srp_cmd(cmnd, evt_struct, srp_cmd, hostdata->dev)) {
1043                if (!firmware_has_feature(FW_FEATURE_CMO))
1044                        sdev_printk(KERN_ERR, cmnd->device,
1045                                    "couldn't convert cmd to srp_cmd\n");
1046                free_event_struct(&hostdata->pool, evt_struct);
1047                return SCSI_MLQUEUE_HOST_BUSY;
1048        }
1049
1050        init_event_struct(evt_struct,
1051                          handle_cmd_rsp,
1052                          VIOSRP_SRP_FORMAT,
1053                          cmnd->request->timeout/HZ);
1054
1055        evt_struct->cmnd = cmnd;
1056        evt_struct->cmnd_done = done;
1057
1058        /* Fix up dma address of the buffer itself */
1059        indirect = (struct srp_indirect_buf *) srp_cmd->add_data;
1060        out_fmt = srp_cmd->buf_fmt >> 4;
1061        in_fmt = srp_cmd->buf_fmt & ((1U << 4) - 1);
1062        if ((in_fmt == SRP_DATA_DESC_INDIRECT ||
1063             out_fmt == SRP_DATA_DESC_INDIRECT) &&
1064            indirect->table_desc.va == 0) {
1065                indirect->table_desc.va = evt_struct->crq.IU_data_ptr +
1066                        offsetof(struct srp_cmd, add_data) +
1067                        offsetof(struct srp_indirect_buf, desc_list);
1068        }
1069
1070        return ibmvscsi_send_srp_event(evt_struct, hostdata, 0);
1071}
1072
1073static DEF_SCSI_QCMD(ibmvscsi_queuecommand)
1074
1075/* ------------------------------------------------------------
1076 * Routines for driver initialization
1077 */
1078
1079/**
1080 * map_persist_bufs: - Pre-map persistent data for adapter logins
1081 * @hostdata:   ibmvscsi_host_data of host
1082 *
1083 * Map the capabilities and adapter info DMA buffers to avoid runtime failures.
1084 * Return 1 on error, 0 on success.
1085 */
1086static int map_persist_bufs(struct ibmvscsi_host_data *hostdata)
1087{
1088
1089        hostdata->caps_addr = dma_map_single(hostdata->dev, &hostdata->caps,
1090                                             sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1091
1092        if (dma_mapping_error(hostdata->dev, hostdata->caps_addr)) {
1093                dev_err(hostdata->dev, "Unable to map capabilities buffer!\n");
1094                return 1;
1095        }
1096
1097        hostdata->adapter_info_addr = dma_map_single(hostdata->dev,
1098                                                     &hostdata->madapter_info,
1099                                                     sizeof(hostdata->madapter_info),
1100                                                     DMA_BIDIRECTIONAL);
1101        if (dma_mapping_error(hostdata->dev, hostdata->adapter_info_addr)) {
1102                dev_err(hostdata->dev, "Unable to map adapter info buffer!\n");
1103                dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1104                                 sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1105                return 1;
1106        }
1107
1108        return 0;
1109}
1110
1111/**
1112 * unmap_persist_bufs: - Unmap persistent data needed for adapter logins
1113 * @hostdata:   ibmvscsi_host_data of host
1114 *
1115 * Unmap the capabilities and adapter info DMA buffers
1116 */
1117static void unmap_persist_bufs(struct ibmvscsi_host_data *hostdata)
1118{
1119        dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1120                         sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1121
1122        dma_unmap_single(hostdata->dev, hostdata->adapter_info_addr,
1123                         sizeof(hostdata->madapter_info), DMA_BIDIRECTIONAL);
1124}
1125
1126/**
1127 * login_rsp: - Handle response to SRP login request
1128 * @evt_struct: srp_event_struct with the response
1129 *
1130 * Used as a "done" callback by when sending srp_login. Gets called
1131 * by ibmvscsi_handle_crq()
1132*/
1133static void login_rsp(struct srp_event_struct *evt_struct)
1134{
1135        struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1136        switch (evt_struct->xfer_iu->srp.login_rsp.opcode) {
1137        case SRP_LOGIN_RSP:     /* it worked! */
1138                break;
1139        case SRP_LOGIN_REJ:     /* refused! */
1140                dev_info(hostdata->dev, "SRP_LOGIN_REJ reason %u\n",
1141                         evt_struct->xfer_iu->srp.login_rej.reason);
1142                /* Login failed.  */
1143                atomic_set(&hostdata->request_limit, -1);
1144                return;
1145        default:
1146                dev_err(hostdata->dev, "Invalid login response typecode 0x%02x!\n",
1147                        evt_struct->xfer_iu->srp.login_rsp.opcode);
1148                /* Login failed.  */
1149                atomic_set(&hostdata->request_limit, -1);
1150                return;
1151        }
1152
1153        dev_info(hostdata->dev, "SRP_LOGIN succeeded\n");
1154        hostdata->client_migrated = 0;
1155
1156        /* Now we know what the real request-limit is.
1157         * This value is set rather than added to request_limit because
1158         * request_limit could have been set to -1 by this client.
1159         */
1160        atomic_set(&hostdata->request_limit,
1161                   evt_struct->xfer_iu->srp.login_rsp.req_lim_delta);
1162
1163        /* If we had any pending I/Os, kick them */
1164        scsi_unblock_requests(hostdata->host);
1165}
1166
1167/**
1168 * send_srp_login: - Sends the srp login
1169 * @hostdata:   ibmvscsi_host_data of host
1170 *
1171 * Returns zero if successful.
1172*/
1173static int send_srp_login(struct ibmvscsi_host_data *hostdata)
1174{
1175        int rc;
1176        unsigned long flags;
1177        struct srp_login_req *login;
1178        struct srp_event_struct *evt_struct = get_event_struct(&hostdata->pool);
1179
1180        BUG_ON(!evt_struct);
1181        init_event_struct(evt_struct, login_rsp,
1182                          VIOSRP_SRP_FORMAT, login_timeout);
1183
1184        login = &evt_struct->iu.srp.login_req;
1185        memset(login, 0, sizeof(*login));
1186        login->opcode = SRP_LOGIN_REQ;
1187        login->req_it_iu_len = sizeof(union srp_iu);
1188        login->req_buf_fmt = SRP_BUF_FORMAT_DIRECT | SRP_BUF_FORMAT_INDIRECT;
1189
1190        spin_lock_irqsave(hostdata->host->host_lock, flags);
1191        /* Start out with a request limit of 0, since this is negotiated in
1192         * the login request we are just sending and login requests always
1193         * get sent by the driver regardless of request_limit.
1194         */
1195        atomic_set(&hostdata->request_limit, 0);
1196
1197        rc = ibmvscsi_send_srp_event(evt_struct, hostdata, login_timeout * 2);
1198        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1199        dev_info(hostdata->dev, "sent SRP login\n");
1200        return rc;
1201};
1202
1203/**
1204 * capabilities_rsp: - Handle response to MAD adapter capabilities request
1205 * @evt_struct: srp_event_struct with the response
1206 *
1207 * Used as a "done" callback by when sending adapter_info.
1208 */
1209static void capabilities_rsp(struct srp_event_struct *evt_struct)
1210{
1211        struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1212
1213        if (evt_struct->xfer_iu->mad.capabilities.common.status) {
1214                dev_err(hostdata->dev, "error 0x%X getting capabilities info\n",
1215                        evt_struct->xfer_iu->mad.capabilities.common.status);
1216        } else {
1217                if (hostdata->caps.migration.common.server_support != SERVER_SUPPORTS_CAP)
1218                        dev_info(hostdata->dev, "Partition migration not supported\n");
1219
1220                if (client_reserve) {
1221                        if (hostdata->caps.reserve.common.server_support ==
1222                            SERVER_SUPPORTS_CAP)
1223                                dev_info(hostdata->dev, "Client reserve enabled\n");
1224                        else
1225                                dev_info(hostdata->dev, "Client reserve not supported\n");
1226                }
1227        }
1228
1229        send_srp_login(hostdata);
1230}
1231
1232/**
1233 * send_mad_capabilities: - Sends the mad capabilities request
1234 *      and stores the result so it can be retrieved with
1235 * @hostdata:   ibmvscsi_host_data of host
1236 */
1237static void send_mad_capabilities(struct ibmvscsi_host_data *hostdata)
1238{
1239        struct viosrp_capabilities *req;
1240        struct srp_event_struct *evt_struct;
1241        unsigned long flags;
1242        struct device_node *of_node = hostdata->dev->of_node;
1243        const char *location;
1244
1245        evt_struct = get_event_struct(&hostdata->pool);
1246        BUG_ON(!evt_struct);
1247
1248        init_event_struct(evt_struct, capabilities_rsp,
1249                          VIOSRP_MAD_FORMAT, info_timeout);
1250
1251        req = &evt_struct->iu.mad.capabilities;
1252        memset(req, 0, sizeof(*req));
1253
1254        hostdata->caps.flags = CAP_LIST_SUPPORTED;
1255        if (hostdata->client_migrated)
1256                hostdata->caps.flags |= CLIENT_MIGRATED;
1257
1258        strncpy(hostdata->caps.name, dev_name(&hostdata->host->shost_gendev),
1259                sizeof(hostdata->caps.name));
1260        hostdata->caps.name[sizeof(hostdata->caps.name) - 1] = '\0';
1261
1262        location = of_get_property(of_node, "ibm,loc-code", NULL);
1263        location = location ? location : dev_name(hostdata->dev);
1264        strncpy(hostdata->caps.loc, location, sizeof(hostdata->caps.loc));
1265        hostdata->caps.loc[sizeof(hostdata->caps.loc) - 1] = '\0';
1266
1267        req->common.type = VIOSRP_CAPABILITIES_TYPE;
1268        req->buffer = hostdata->caps_addr;
1269
1270        hostdata->caps.migration.common.cap_type = MIGRATION_CAPABILITIES;
1271        hostdata->caps.migration.common.length = sizeof(hostdata->caps.migration);
1272        hostdata->caps.migration.common.server_support = SERVER_SUPPORTS_CAP;
1273        hostdata->caps.migration.ecl = 1;
1274
1275        if (client_reserve) {
1276                hostdata->caps.reserve.common.cap_type = RESERVATION_CAPABILITIES;
1277                hostdata->caps.reserve.common.length = sizeof(hostdata->caps.reserve);
1278                hostdata->caps.reserve.common.server_support = SERVER_SUPPORTS_CAP;
1279                hostdata->caps.reserve.type = CLIENT_RESERVE_SCSI_2;
1280                req->common.length = sizeof(hostdata->caps);
1281        } else
1282                req->common.length = sizeof(hostdata->caps) - sizeof(hostdata->caps.reserve);
1283
1284        spin_lock_irqsave(hostdata->host->host_lock, flags);
1285        if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1286                dev_err(hostdata->dev, "couldn't send CAPABILITIES_REQ!\n");
1287        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1288};
1289
1290/**
1291 * fast_fail_rsp: - Handle response to MAD enable fast fail
1292 * @evt_struct: srp_event_struct with the response
1293 *
1294 * Used as a "done" callback by when sending enable fast fail. Gets called
1295 * by ibmvscsi_handle_crq()
1296 */
1297static void fast_fail_rsp(struct srp_event_struct *evt_struct)
1298{
1299        struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1300        u8 status = evt_struct->xfer_iu->mad.fast_fail.common.status;
1301
1302        if (status == VIOSRP_MAD_NOT_SUPPORTED)
1303                dev_err(hostdata->dev, "fast_fail not supported in server\n");
1304        else if (status == VIOSRP_MAD_FAILED)
1305                dev_err(hostdata->dev, "fast_fail request failed\n");
1306        else if (status != VIOSRP_MAD_SUCCESS)
1307                dev_err(hostdata->dev, "error 0x%X enabling fast_fail\n", status);
1308
1309        send_mad_capabilities(hostdata);
1310}
1311
1312/**
1313 * init_host - Start host initialization
1314 * @hostdata:   ibmvscsi_host_data of host
1315 *
1316 * Returns zero if successful.
1317 */
1318static int enable_fast_fail(struct ibmvscsi_host_data *hostdata)
1319{
1320        int rc;
1321        unsigned long flags;
1322        struct viosrp_fast_fail *fast_fail_mad;
1323        struct srp_event_struct *evt_struct;
1324
1325        if (!fast_fail) {
1326                send_mad_capabilities(hostdata);
1327                return 0;
1328        }
1329
1330        evt_struct = get_event_struct(&hostdata->pool);
1331        BUG_ON(!evt_struct);
1332
1333        init_event_struct(evt_struct, fast_fail_rsp, VIOSRP_MAD_FORMAT, info_timeout);
1334
1335        fast_fail_mad = &evt_struct->iu.mad.fast_fail;
1336        memset(fast_fail_mad, 0, sizeof(*fast_fail_mad));
1337        fast_fail_mad->common.type = VIOSRP_ENABLE_FAST_FAIL;
1338        fast_fail_mad->common.length = sizeof(*fast_fail_mad);
1339
1340        spin_lock_irqsave(hostdata->host->host_lock, flags);
1341        rc = ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2);
1342        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1343        return rc;
1344}
1345
1346/**
1347 * adapter_info_rsp: - Handle response to MAD adapter info request
1348 * @evt_struct: srp_event_struct with the response
1349 *
1350 * Used as a "done" callback by when sending adapter_info. Gets called
1351 * by ibmvscsi_handle_crq()
1352*/
1353static void adapter_info_rsp(struct srp_event_struct *evt_struct)
1354{
1355        struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1356
1357        if (evt_struct->xfer_iu->mad.adapter_info.common.status) {
1358                dev_err(hostdata->dev, "error %d getting adapter info\n",
1359                        evt_struct->xfer_iu->mad.adapter_info.common.status);
1360        } else {
1361                dev_info(hostdata->dev, "host srp version: %s, "
1362                         "host partition %s (%d), OS %d, max io %u\n",
1363                         hostdata->madapter_info.srp_version,
1364                         hostdata->madapter_info.partition_name,
1365                         hostdata->madapter_info.partition_number,
1366                         hostdata->madapter_info.os_type,
1367                         hostdata->madapter_info.port_max_txu[0]);
1368                
1369                if (hostdata->madapter_info.port_max_txu[0]) 
1370                        hostdata->host->max_sectors = 
1371                                hostdata->madapter_info.port_max_txu[0] >> 9;
1372                
1373                if (hostdata->madapter_info.os_type == 3 &&
1374                    strcmp(hostdata->madapter_info.srp_version, "1.6a") <= 0) {
1375                        dev_err(hostdata->dev, "host (Ver. %s) doesn't support large transfers\n",
1376                                hostdata->madapter_info.srp_version);
1377                        dev_err(hostdata->dev, "limiting scatterlists to %d\n",
1378                                MAX_INDIRECT_BUFS);
1379                        hostdata->host->sg_tablesize = MAX_INDIRECT_BUFS;
1380                }
1381
1382                if (hostdata->madapter_info.os_type == 3) {
1383                        enable_fast_fail(hostdata);
1384                        return;
1385                }
1386        }
1387
1388        send_srp_login(hostdata);
1389}
1390
1391/**
1392 * send_mad_adapter_info: - Sends the mad adapter info request
1393 *      and stores the result so it can be retrieved with
1394 *      sysfs.  We COULD consider causing a failure if the
1395 *      returned SRP version doesn't match ours.
1396 * @hostdata:   ibmvscsi_host_data of host
1397 * 
1398 * Returns zero if successful.
1399*/
1400static void send_mad_adapter_info(struct ibmvscsi_host_data *hostdata)
1401{
1402        struct viosrp_adapter_info *req;
1403        struct srp_event_struct *evt_struct;
1404        unsigned long flags;
1405
1406        evt_struct = get_event_struct(&hostdata->pool);
1407        BUG_ON(!evt_struct);
1408
1409        init_event_struct(evt_struct,
1410                          adapter_info_rsp,
1411                          VIOSRP_MAD_FORMAT,
1412                          info_timeout);
1413        
1414        req = &evt_struct->iu.mad.adapter_info;
1415        memset(req, 0x00, sizeof(*req));
1416        
1417        req->common.type = VIOSRP_ADAPTER_INFO_TYPE;
1418        req->common.length = sizeof(hostdata->madapter_info);
1419        req->buffer = hostdata->adapter_info_addr;
1420
1421        spin_lock_irqsave(hostdata->host->host_lock, flags);
1422        if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1423                dev_err(hostdata->dev, "couldn't send ADAPTER_INFO_REQ!\n");
1424        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1425};
1426
/**
 * init_adapter: Start virtual adapter initialization sequence
 * @hostdata:	ibmvscsi_host_data of host
 *
 * The sequence starts with the MAD adapter info request; the follow-up
 * requests are issued from the response callbacks.
 */
static void init_adapter(struct ibmvscsi_host_data *hostdata)
{
	/* First step of the sequence */
	send_mad_adapter_info(hostdata);
}
1435
1436/**
1437 * sync_completion: Signal that a synchronous command has completed
1438 * Note that after returning from this call, the evt_struct is freed.
1439 * the caller waiting on this completion shouldn't touch the evt_struct
1440 * again.
1441 */
1442static void sync_completion(struct srp_event_struct *evt_struct)
1443{
1444        /* copy the response back */
1445        if (evt_struct->sync_srp)
1446                *evt_struct->sync_srp = *evt_struct->xfer_iu;
1447        
1448        complete(&evt_struct->comp);
1449}
1450
1451/**
1452 * ibmvscsi_abort: Abort a command...from scsi host template
1453 * send this over to the server and wait synchronously for the response
1454 */
1455static int ibmvscsi_eh_abort_handler(struct scsi_cmnd *cmd)
1456{
1457        struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1458        struct srp_tsk_mgmt *tsk_mgmt;
1459        struct srp_event_struct *evt;
1460        struct srp_event_struct *tmp_evt, *found_evt;
1461        union viosrp_iu srp_rsp;
1462        int rsp_rc;
1463        unsigned long flags;
1464        u16 lun = lun_from_dev(cmd->device);
1465        unsigned long wait_switch = 0;
1466
1467        /* First, find this command in our sent list so we can figure
1468         * out the correct tag
1469         */
1470        spin_lock_irqsave(hostdata->host->host_lock, flags);
1471        wait_switch = jiffies + (init_timeout * HZ);
1472        do {
1473                found_evt = NULL;
1474                list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1475                        if (tmp_evt->cmnd == cmd) {
1476                                found_evt = tmp_evt;
1477                                break;
1478                        }
1479                }
1480
1481                if (!found_evt) {
1482                        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1483                        return SUCCESS;
1484                }
1485
1486                evt = get_event_struct(&hostdata->pool);
1487                if (evt == NULL) {
1488                        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1489                        sdev_printk(KERN_ERR, cmd->device,
1490                                "failed to allocate abort event\n");
1491                        return FAILED;
1492                }
1493        
1494                init_event_struct(evt,
1495                                  sync_completion,
1496                                  VIOSRP_SRP_FORMAT,
1497                                  abort_timeout);
1498
1499                tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1500        
1501                /* Set up an abort SRP command */
1502                memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1503                tsk_mgmt->opcode = SRP_TSK_MGMT;
1504                tsk_mgmt->lun = ((u64) lun) << 48;
1505                tsk_mgmt->tsk_mgmt_func = SRP_TSK_ABORT_TASK;
1506                tsk_mgmt->task_tag = (u64) found_evt;
1507
1508                evt->sync_srp = &srp_rsp;
1509
1510                init_completion(&evt->comp);
1511                rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, abort_timeout * 2);
1512
1513                if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1514                        break;
1515
1516                spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1517                msleep(10);
1518                spin_lock_irqsave(hostdata->host->host_lock, flags);
1519        } while (time_before(jiffies, wait_switch));
1520
1521        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1522
1523        if (rsp_rc != 0) {
1524                sdev_printk(KERN_ERR, cmd->device,
1525                            "failed to send abort() event. rc=%d\n", rsp_rc);
1526                return FAILED;
1527        }
1528
1529        sdev_printk(KERN_INFO, cmd->device,
1530                    "aborting command. lun 0x%llx, tag 0x%llx\n",
1531                    (((u64) lun) << 48), (u64) found_evt);
1532
1533        wait_for_completion(&evt->comp);
1534
1535        /* make sure we got a good response */
1536        if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1537                if (printk_ratelimit())
1538                        sdev_printk(KERN_WARNING, cmd->device, "abort bad SRP RSP type %d\n",
1539                                    srp_rsp.srp.rsp.opcode);
1540                return FAILED;
1541        }
1542
1543        if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1544                rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1545        else
1546                rsp_rc = srp_rsp.srp.rsp.status;
1547
1548        if (rsp_rc) {
1549                if (printk_ratelimit())
1550                        sdev_printk(KERN_WARNING, cmd->device,
1551                                    "abort code %d for task tag 0x%llx\n",
1552                                    rsp_rc, tsk_mgmt->task_tag);
1553                return FAILED;
1554        }
1555
1556        /* Because we dropped the spinlock above, it's possible
1557         * The event is no longer in our list.  Make sure it didn't
1558         * complete while we were aborting
1559         */
1560        spin_lock_irqsave(hostdata->host->host_lock, flags);
1561        found_evt = NULL;
1562        list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1563                if (tmp_evt->cmnd == cmd) {
1564                        found_evt = tmp_evt;
1565                        break;
1566                }
1567        }
1568
1569        if (found_evt == NULL) {
1570                spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1571                sdev_printk(KERN_INFO, cmd->device, "aborted task tag 0x%llx completed\n",
1572                            tsk_mgmt->task_tag);
1573                return SUCCESS;
1574        }
1575
1576        sdev_printk(KERN_INFO, cmd->device, "successfully aborted task tag 0x%llx\n",
1577                    tsk_mgmt->task_tag);
1578
1579        cmd->result = (DID_ABORT << 16);
1580        list_del(&found_evt->list);
1581        unmap_cmd_data(&found_evt->iu.srp.cmd, found_evt,
1582                       found_evt->hostdata->dev);
1583        free_event_struct(&found_evt->hostdata->pool, found_evt);
1584        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1585        atomic_inc(&hostdata->request_limit);
1586        return SUCCESS;
1587}
1588
1589/**
1590 * ibmvscsi_eh_device_reset_handler: Reset a single LUN...from scsi host 
1591 * template send this over to the server and wait synchronously for the 
1592 * response
1593 */
1594static int ibmvscsi_eh_device_reset_handler(struct scsi_cmnd *cmd)
1595{
1596        struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1597        struct srp_tsk_mgmt *tsk_mgmt;
1598        struct srp_event_struct *evt;
1599        struct srp_event_struct *tmp_evt, *pos;
1600        union viosrp_iu srp_rsp;
1601        int rsp_rc;
1602        unsigned long flags;
1603        u16 lun = lun_from_dev(cmd->device);
1604        unsigned long wait_switch = 0;
1605
1606        spin_lock_irqsave(hostdata->host->host_lock, flags);
1607        wait_switch = jiffies + (init_timeout * HZ);
1608        do {
1609                evt = get_event_struct(&hostdata->pool);
1610                if (evt == NULL) {
1611                        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1612                        sdev_printk(KERN_ERR, cmd->device,
1613                                "failed to allocate reset event\n");
1614                        return FAILED;
1615                }
1616        
1617                init_event_struct(evt,
1618                                  sync_completion,
1619                                  VIOSRP_SRP_FORMAT,
1620                                  reset_timeout);
1621
1622                tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1623
1624                /* Set up a lun reset SRP command */
1625                memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1626                tsk_mgmt->opcode = SRP_TSK_MGMT;
1627                tsk_mgmt->lun = ((u64) lun) << 48;
1628                tsk_mgmt->tsk_mgmt_func = SRP_TSK_LUN_RESET;
1629
1630                evt->sync_srp = &srp_rsp;
1631
1632                init_completion(&evt->comp);
1633                rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, reset_timeout * 2);
1634
1635                if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1636                        break;
1637
1638                spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1639                msleep(10);
1640                spin_lock_irqsave(hostdata->host->host_lock, flags);
1641        } while (time_before(jiffies, wait_switch));
1642
1643        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1644
1645        if (rsp_rc != 0) {
1646                sdev_printk(KERN_ERR, cmd->device,
1647                            "failed to send reset event. rc=%d\n", rsp_rc);
1648                return FAILED;
1649        }
1650
1651        sdev_printk(KERN_INFO, cmd->device, "resetting device. lun 0x%llx\n",
1652                    (((u64) lun) << 48));
1653
1654        wait_for_completion(&evt->comp);
1655
1656        /* make sure we got a good response */
1657        if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1658                if (printk_ratelimit())
1659                        sdev_printk(KERN_WARNING, cmd->device, "reset bad SRP RSP type %d\n",
1660                                    srp_rsp.srp.rsp.opcode);
1661                return FAILED;
1662        }
1663
1664        if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1665                rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1666        else
1667                rsp_rc = srp_rsp.srp.rsp.status;
1668
1669        if (rsp_rc) {
1670                if (printk_ratelimit())
1671                        sdev_printk(KERN_WARNING, cmd->device,
1672                                    "reset code %d for task tag 0x%llx\n",
1673                                    rsp_rc, tsk_mgmt->task_tag);
1674                return FAILED;
1675        }
1676
1677        /* We need to find all commands for this LUN that have not yet been
1678         * responded to, and fail them with DID_RESET
1679         */
1680        spin_lock_irqsave(hostdata->host->host_lock, flags);
1681        list_for_each_entry_safe(tmp_evt, pos, &hostdata->sent, list) {
1682                if ((tmp_evt->cmnd) && (tmp_evt->cmnd->device == cmd->device)) {
1683                        if (tmp_evt->cmnd)
1684                                tmp_evt->cmnd->result = (DID_RESET << 16);
1685                        list_del(&tmp_evt->list);
1686                        unmap_cmd_data(&tmp_evt->iu.srp.cmd, tmp_evt,
1687                                       tmp_evt->hostdata->dev);
1688                        free_event_struct(&tmp_evt->hostdata->pool,
1689                                                   tmp_evt);
1690                        atomic_inc(&hostdata->request_limit);
1691                        if (tmp_evt->cmnd_done)
1692                                tmp_evt->cmnd_done(tmp_evt->cmnd);
1693                        else if (tmp_evt->done)
1694                                tmp_evt->done(tmp_evt);
1695                }
1696        }
1697        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1698        return SUCCESS;
1699}
1700
1701/**
1702 * ibmvscsi_eh_host_reset_handler - Reset the connection to the server
1703 * @cmd:        struct scsi_cmnd having problems
1704*/
1705static int ibmvscsi_eh_host_reset_handler(struct scsi_cmnd *cmd)
1706{
1707        unsigned long wait_switch = 0;
1708        struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1709
1710        dev_err(hostdata->dev, "Resetting connection due to error recovery\n");
1711
1712        ibmvscsi_reset_host(hostdata);
1713
1714        for (wait_switch = jiffies + (init_timeout * HZ);
1715             time_before(jiffies, wait_switch) &&
1716                     atomic_read(&hostdata->request_limit) < 2;) {
1717
1718                msleep(10);
1719        }
1720
1721        if (atomic_read(&hostdata->request_limit) <= 0)
1722                return FAILED;
1723
1724        return SUCCESS;
1725}
1726
1727/**
1728 * ibmvscsi_handle_crq: - Handles and frees received events in the CRQ
1729 * @crq:        Command/Response queue
1730 * @hostdata:   ibmvscsi_host_data of host
1731 *
1732*/
1733static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
1734                                struct ibmvscsi_host_data *hostdata)
1735{
1736        long rc;
1737        unsigned long flags;
1738        struct srp_event_struct *evt_struct =
1739            (struct srp_event_struct *)crq->IU_data_ptr;
1740        switch (crq->valid) {
1741        case 0xC0:              /* initialization */
1742                switch (crq->format) {
1743                case 0x01:      /* Initialization message */
1744                        dev_info(hostdata->dev, "partner initialized\n");
1745                        /* Send back a response */
1746                        rc = ibmvscsi_send_crq(hostdata, 0xC002000000000000LL, 0);
1747                        if (rc == 0) {
1748                                /* Now login */
1749                                init_adapter(hostdata);
1750                        } else {
1751                                dev_err(hostdata->dev, "Unable to send init rsp. rc=%ld\n", rc);
1752                        }
1753
1754                        break;
1755                case 0x02:      /* Initialization response */
1756                        dev_info(hostdata->dev, "partner initialization complete\n");
1757
1758                        /* Now login */
1759                        init_adapter(hostdata);
1760                        break;
1761                default:
1762                        dev_err(hostdata->dev, "unknown crq message type: %d\n", crq->format);
1763                }
1764                return;
1765        case 0xFF:      /* Hypervisor telling us the connection is closed */
1766                scsi_block_requests(hostdata->host);
1767                atomic_set(&hostdata->request_limit, 0);
1768                if (crq->format == 0x06) {
1769                        /* We need to re-setup the interpartition connection */
1770                        dev_info(hostdata->dev, "Re-enabling adapter!\n");
1771                        hostdata->client_migrated = 1;
1772                        hostdata->reenable_crq = 1;
1773                        purge_requests(hostdata, DID_REQUEUE);
1774                        wake_up(&hostdata->work_wait_q);
1775                } else {
1776                        dev_err(hostdata->dev, "Virtual adapter failed rc %d!\n",
1777                                crq->format);
1778                        ibmvscsi_reset_host(hostdata);
1779                }
1780                return;
1781        case 0x80:              /* real payload */
1782                break;
1783        default:
1784                dev_err(hostdata->dev, "got an invalid message type 0x%02x\n",
1785                        crq->valid);
1786                return;
1787        }
1788
1789        /* The only kind of payload CRQs we should get are responses to
1790         * things we send. Make sure this response is to something we
1791         * actually sent
1792         */
1793        if (!valid_event_struct(&hostdata->pool, evt_struct)) {
1794                dev_err(hostdata->dev, "returned correlation_token 0x%p is invalid!\n",
1795                       (void *)crq->IU_data_ptr);
1796                return;
1797        }
1798
1799        if (atomic_read(&evt_struct->free)) {
1800                dev_err(hostdata->dev, "received duplicate correlation_token 0x%p!\n",
1801                        (void *)crq->IU_data_ptr);
1802                return;
1803        }
1804
1805        if (crq->format == VIOSRP_SRP_FORMAT)
1806                atomic_add(evt_struct->xfer_iu->srp.rsp.req_lim_delta,
1807                           &hostdata->request_limit);
1808
1809        del_timer(&evt_struct->timer);
1810
1811        if ((crq->status != VIOSRP_OK && crq->status != VIOSRP_OK2) && evt_struct->cmnd)
1812                evt_struct->cmnd->result = DID_ERROR << 16;
1813        if (evt_struct->done)
1814                evt_struct->done(evt_struct);
1815        else
1816                dev_err(hostdata->dev, "returned done() is NULL; not running it!\n");
1817
1818        /*
1819         * Lock the host_lock before messing with these structures, since we
1820         * are running in a task context
1821         */
1822        spin_lock_irqsave(evt_struct->hostdata->host->host_lock, flags);
1823        list_del(&evt_struct->list);
1824        free_event_struct(&evt_struct->hostdata->pool, evt_struct);
1825        spin_unlock_irqrestore(evt_struct->hostdata->host->host_lock, flags);
1826}
1827
1828/**
1829 * ibmvscsi_get_host_config: Send the command to the server to get host
1830 * configuration data.  The data is opaque to us.
1831 */
1832static int ibmvscsi_do_host_config(struct ibmvscsi_host_data *hostdata,
1833                                   unsigned char *buffer, int length)
1834{
1835        struct viosrp_host_config *host_config;
1836        struct srp_event_struct *evt_struct;
1837        unsigned long flags;
1838        dma_addr_t addr;
1839        int rc;
1840
1841        evt_struct = get_event_struct(&hostdata->pool);
1842        if (!evt_struct) {
1843                dev_err(hostdata->dev, "couldn't allocate event for HOST_CONFIG!\n");
1844                return -1;
1845        }
1846
1847        init_event_struct(evt_struct,
1848                          sync_completion,
1849                          VIOSRP_MAD_FORMAT,
1850                          info_timeout);
1851
1852        host_config = &evt_struct->iu.mad.host_config;
1853
1854        /* The transport length field is only 16-bit */
1855        length = min(0xffff, length);
1856
1857        /* Set up a lun reset SRP command */
1858        memset(host_config, 0x00, sizeof(*host_config));
1859        host_config->common.type = VIOSRP_HOST_CONFIG_TYPE;
1860        host_config->common.length = length;
1861        host_config->buffer = addr = dma_map_single(hostdata->dev, buffer,
1862                                                    length,
1863                                                    DMA_BIDIRECTIONAL);
1864
1865        if (dma_mapping_error(hostdata->dev, host_config->buffer)) {
1866                if (!firmware_has_feature(FW_FEATURE_CMO))
1867                        dev_err(hostdata->dev,
1868                                "dma_mapping error getting host config\n");
1869                free_event_struct(&hostdata->pool, evt_struct);
1870                return -1;
1871        }
1872
1873        init_completion(&evt_struct->comp);
1874        spin_lock_irqsave(hostdata->host->host_lock, flags);
1875        rc = ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2);
1876        spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1877        if (rc == 0)
1878                wait_for_completion(&evt_struct->comp);
1879        dma_unmap_single(hostdata->dev, addr, length, DMA_BIDIRECTIONAL);
1880
1881        return rc;
1882}
1883
1884/**
1885 * ibmvscsi_slave_configure: Set the "allow_restart" flag for each disk.
1886 * @sdev:       struct scsi_device device to configure
1887 *
1888 * Enable allow_restart for a device if it is a disk.  Adjust the
1889 * queue_depth here also as is required by the documentation for
1890 * struct scsi_host_template.
1891 */
1892static int ibmvscsi_slave_configure(struct scsi_device *sdev)
1893{
1894        struct Scsi_Host *shost = sdev->host;
1895        unsigned long lock_flags = 0;
1896
1897        spin_lock_irqsave(shost->host_lock, lock_flags);
1898        if (sdev->type == TYPE_DISK) {
1899                sdev->allow_restart = 1;
1900                blk_queue_rq_timeout(sdev->request_queue, 120 * HZ);
1901        }
1902        scsi_adjust_queue_depth(sdev, 0, shost->cmd_per_lun);
1903        spin_unlock_irqrestore(shost->host_lock, lock_flags);
1904        return 0;
1905}
1906
1907/**
1908 * ibmvscsi_change_queue_depth - Change the device's queue depth
1909 * @sdev:       scsi device struct
1910 * @qdepth:     depth to set
1911 * @reason:     calling context
1912 *
1913 * Return value:
1914 *      actual depth set
1915 **/
1916static int ibmvscsi_change_queue_depth(struct scsi_device *sdev, int qdepth,
1917                                       int reason)
1918{
1919        if (reason != SCSI_QDEPTH_DEFAULT)
1920                return -EOPNOTSUPP;
1921
1922        if (qdepth > IBMVSCSI_MAX_CMDS_PER_LUN)
1923                qdepth = IBMVSCSI_MAX_CMDS_PER_LUN;
1924
1925        scsi_adjust_queue_depth(sdev, 0, qdepth);
1926        return sdev->queue_depth;
1927}
1928
1929/* ------------------------------------------------------------
1930 * sysfs attributes
1931 */
1932static ssize_t show_host_vhost_loc(struct device *dev,
1933                                   struct device_attribute *attr, char *buf)
1934{
1935        struct Scsi_Host *shost = class_to_shost(dev);
1936        struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1937        int len;
1938
1939        len = snprintf(buf, sizeof(hostdata->caps.loc), "%s\n",
1940                       hostdata->caps.loc);
1941        return len;
1942}
1943
1944static struct device_attribute ibmvscsi_host_vhost_loc = {
1945        .attr = {
1946                 .name = "vhost_loc",
1947                 .mode = S_IRUGO,
1948                 },
1949        .show = show_host_vhost_loc,
1950};
1951
1952static ssize_t show_host_vhost_name(struct device *dev,
1953                                    struct device_attribute *attr, char *buf)
1954{
1955        struct Scsi_Host *shost = class_to_shost(dev);
1956        struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1957        int len;
1958
1959        len = snprintf(buf, sizeof(hostdata->caps.name), "%s\n",
1960                       hostdata->caps.name);
1961        return len;
1962}
1963
1964static struct device_attribute ibmvscsi_host_vhost_name = {
1965        .attr = {
1966                 .name = "vhost_name",
1967                 .mode = S_IRUGO,
1968                 },
1969        .show = show_host_vhost_name,
1970};
1971
1972static ssize_t show_host_srp_version(struct device *dev,
1973                                     struct device_attribute *attr, char *buf)
1974{
1975        struct Scsi_Host *shost = class_to_shost(dev);
1976        struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1977        int len;
1978
1979        len = snprintf(buf, PAGE_SIZE, "%s\n",
1980                       hostdata->madapter_info.srp_version);
1981        return len;
1982}
1983
1984static struct device_attribute ibmvscsi_host_srp_version = {
1985        .attr = {
1986                 .name = "srp_version",
1987                 .mode = S_IRUGO,
1988                 },
1989        .show = show_host_srp_version,
1990};
1991
1992static ssize_t show_host_partition_name(struct device *dev,
1993                                        struct device_attribute *attr,
1994                                        char *buf)
1995{
1996        struct Scsi_Host *shost = class_to_shost(dev);
1997        struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1998        int len;
1999
2000        len = snprintf(buf, PAGE_SIZE, "%s\n",
2001                       hostdata->madapter_info.partition_name);
2002        return len;
2003}
2004
2005static struct device_attribute ibmvscsi_host_partition_name = {
2006        .attr = {
2007                 .name = "partition_name",
2008                 .mode = S_IRUGO,
2009                 },
2010        .show = show_host_partition_name,
2011};
2012
2013static ssize_t show_host_partition_number(struct device *dev,
2014                                          struct device_attribute *attr,
2015                                          char *buf)
2016{
2017        struct Scsi_Host *shost = class_to_shost(dev);
2018        struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2019        int len;
2020
2021        len = snprintf(buf, PAGE_SIZE, "%d\n",
2022                       hostdata->madapter_info.partition_number);
2023        return len;
2024}
2025
2026static struct device_attribute ibmvscsi_host_partition_number = {
2027        .attr = {
2028                 .name = "partition_number",
2029                 .mode = S_IRUGO,
2030                 },
2031        .show = show_host_partition_number,
2032};
2033
2034static ssize_t show_host_mad_version(struct device *dev,
2035                                     struct device_attribute *attr, char *buf)
2036{
2037        struct Scsi_Host *shost = class_to_shost(dev);
2038        struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2039        int len;
2040
2041        len = snprintf(buf, PAGE_SIZE, "%d\n",
2042                       hostdata->madapter_info.mad_version);
2043        return len;
2044}
2045
2046static struct device_attribute ibmvscsi_host_mad_version = {
2047        .attr = {
2048                 .name = "mad_version",
2049                 .mode = S_IRUGO,
2050                 },
2051        .show = show_host_mad_version,
2052};
2053
2054static ssize_t show_host_os_type(struct device *dev,
2055                                 struct device_attribute *attr, char *buf)
2056{
2057        struct Scsi_Host *shost = class_to_shost(dev);
2058        struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2059        int len;
2060
2061        len = snprintf(buf, PAGE_SIZE, "%d\n", hostdata->madapter_info.os_type);
2062        return len;
2063}
2064
2065static struct device_attribute ibmvscsi_host_os_type = {
2066        .attr = {
2067                 .name = "os_type",
2068                 .mode = S_IRUGO,
2069                 },
2070        .show = show_host_os_type,
2071};
2072
2073static ssize_t show_host_config(struct device *dev,
2074                                struct device_attribute *attr, char *buf)
2075{
2076        struct Scsi_Host *shost = class_to_shost(dev);
2077        struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2078
2079        /* returns null-terminated host config data */
2080        if (ibmvscsi_do_host_config(hostdata, buf, PAGE_SIZE) == 0)
2081                return strlen(buf);
2082        else
2083                return 0;
2084}
2085
2086static struct device_attribute ibmvscsi_host_config = {
2087        .attr = {
2088                 .name = "config",
2089                 .mode = S_IRUGO,
2090                 },
2091        .show = show_host_config,
2092};
2093
2094static struct device_attribute *ibmvscsi_attrs[] = {
2095        &ibmvscsi_host_vhost_loc,
2096        &ibmvscsi_host_vhost_name,
2097        &ibmvscsi_host_srp_version,
2098        &ibmvscsi_host_partition_name,
2099        &ibmvscsi_host_partition_number,
2100        &ibmvscsi_host_mad_version,
2101        &ibmvscsi_host_os_type,
2102        &ibmvscsi_host_config,
2103        NULL
2104};
2105
2106/* ------------------------------------------------------------
2107 * SCSI driver registration
2108 */
2109static struct scsi_host_template driver_template = {
2110        .module = THIS_MODULE,
2111        .name = "IBM POWER Virtual SCSI Adapter " IBMVSCSI_VERSION,
2112        .proc_name = "ibmvscsi",
2113        .queuecommand = ibmvscsi_queuecommand,
2114        .eh_abort_handler = ibmvscsi_eh_abort_handler,
2115        .eh_device_reset_handler = ibmvscsi_eh_device_reset_handler,
2116        .eh_host_reset_handler = ibmvscsi_eh_host_reset_handler,
2117        .slave_configure = ibmvscsi_slave_configure,
2118        .change_queue_depth = ibmvscsi_change_queue_depth,
2119        .cmd_per_lun = IBMVSCSI_CMDS_PER_LUN_DEFAULT,
2120        .can_queue = IBMVSCSI_MAX_REQUESTS_DEFAULT,
2121        .this_id = -1,
2122        .sg_tablesize = SG_ALL,
2123        .use_clustering = ENABLE_CLUSTERING,
2124        .shost_attrs = ibmvscsi_attrs,
2125};
2126
2127/**
2128 * ibmvscsi_get_desired_dma - Calculate IO memory desired by the driver
2129 *
2130 * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
2131 *
2132 * Return value:
2133 *      Number of bytes of IO data the driver will need to perform well.
2134 */
2135static unsigned long ibmvscsi_get_desired_dma(struct vio_dev *vdev)
2136{
2137        /* iu_storage data allocated in initialize_event_pool */
2138        unsigned long desired_io = max_events * sizeof(union viosrp_iu);
2139
2140        /* add io space for sg data */
2141        desired_io += (IBMVSCSI_MAX_SECTORS_DEFAULT * 512 *
2142                             IBMVSCSI_CMDS_PER_LUN_DEFAULT);
2143
2144        return desired_io;
2145}
2146
2147static void ibmvscsi_do_work(struct ibmvscsi_host_data *hostdata)
2148{
2149        int rc;
2150        char *action = "reset";
2151
2152        if (hostdata->reset_crq) {
2153                smp_rmb();
2154                hostdata->reset_crq = 0;
2155
2156                rc = ibmvscsi_reset_crq_queue(&hostdata->queue, hostdata);
2157                if (!rc)
2158                        rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
2159                vio_enable_interrupts(to_vio_dev(hostdata->dev));
2160        } else if (hostdata->reenable_crq) {
2161                smp_rmb();
2162                action = "enable";
2163                rc = ibmvscsi_reenable_crq_queue(&hostdata->queue, hostdata);
2164                hostdata->reenable_crq = 0;
2165                if (!rc)
2166                        rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
2167        } else
2168                return;
2169
2170        if (rc) {
2171                atomic_set(&hostdata->request_limit, -1);
2172                dev_err(hostdata->dev, "error after %s\n", action);
2173        }
2174
2175        scsi_unblock_requests(hostdata->host);
2176}
2177
2178static int ibmvscsi_work_to_do(struct ibmvscsi_host_data *hostdata)
2179{
2180        if (kthread_should_stop())
2181                return 1;
2182        else if (hostdata->reset_crq) {
2183                smp_rmb();
2184                return 1;
2185        } else if (hostdata->reenable_crq) {
2186                smp_rmb();
2187                return 1;
2188        }
2189
2190        return 0;
2191}
2192
2193static int ibmvscsi_work(void *data)
2194{
2195        struct ibmvscsi_host_data *hostdata = data;
2196        int rc;
2197
2198        set_user_nice(current, -20);
2199
2200        while (1) {
2201                rc = wait_event_interruptible(hostdata->work_wait_q,
2202                                              ibmvscsi_work_to_do(hostdata));
2203
2204                BUG_ON(rc);
2205
2206                if (kthread_should_stop())
2207                        break;
2208
2209                ibmvscsi_do_work(hostdata);
2210        }
2211
2212        return 0;
2213}
2214
2215/**
2216 * Called by bus code for each adapter
2217 */
2218static int ibmvscsi_probe(struct vio_dev *vdev, const struct vio_device_id *id)
2219{
2220        struct ibmvscsi_host_data *hostdata;
2221        struct Scsi_Host *host;
2222        struct device *dev = &vdev->dev;
2223        struct srp_rport_identifiers ids;
2224        struct srp_rport *rport;
2225        unsigned long wait_switch = 0;
2226        int rc;
2227
2228        dev_set_drvdata(&vdev->dev, NULL);
2229
2230        host = scsi_host_alloc(&driver_template, sizeof(*hostdata));
2231        if (!host) {
2232                dev_err(&vdev->dev, "couldn't allocate host data\n");
2233                goto scsi_host_alloc_failed;
2234        }
2235
2236        host->transportt = ibmvscsi_transport_template;
2237        hostdata = shost_priv(host);
2238        memset(hostdata, 0x00, sizeof(*hostdata));
2239        INIT_LIST_HEAD(&hostdata->sent);
2240        init_waitqueue_head(&hostdata->work_wait_q);
2241        hostdata->host = host;
2242        hostdata->dev = dev;
2243        atomic_set(&hostdata->request_limit, -1);
2244        hostdata->host->max_sectors = IBMVSCSI_MAX_SECTORS_DEFAULT;
2245
2246        if (map_persist_bufs(hostdata)) {
2247                dev_err(&vdev->dev, "couldn't map persistent buffers\n");
2248                goto persist_bufs_failed;
2249        }
2250
2251        hostdata->work_thread = kthread_run(ibmvscsi_work, hostdata, "%s_%d",
2252                                            "ibmvscsi", host->host_no);
2253
2254        if (IS_ERR(hostdata->work_thread)) {
2255                dev_err(&vdev->dev, "couldn't initialize kthread. rc=%ld\n",
2256                        PTR_ERR(hostdata->work_thread));
2257                goto init_crq_failed;
2258        }
2259
2260        rc = ibmvscsi_init_crq_queue(&hostdata->queue, hostdata, max_events);
2261        if (rc != 0 && rc != H_RESOURCE) {
2262                dev_err(&vdev->dev, "couldn't initialize crq. rc=%d\n", rc);
2263                goto kill_kthread;
2264        }
2265        if (initialize_event_pool(&hostdata->pool, max_events, hostdata) != 0) {
2266                dev_err(&vdev->dev, "couldn't initialize event pool\n");
2267                goto init_pool_failed;
2268        }
2269
2270        host->max_lun = 8;
2271        host->max_id = max_id;
2272        host->max_channel = max_channel;
2273        host->max_cmd_len = 16;
2274
2275        if (scsi_add_host(hostdata->host, hostdata->dev))
2276                goto add_host_failed;
2277
2278        /* we don't have a proper target_port_id so let's use the fake one */
2279        memcpy(ids.port_id, hostdata->madapter_info.partition_name,
2280               sizeof(ids.port_id));
2281        ids.roles = SRP_RPORT_ROLE_TARGET;
2282        rport = srp_rport_add(host, &ids);
2283        if (IS_ERR(rport))
2284                goto add_srp_port_failed;
2285
2286        /* Try to send an initialization message.  Note that this is allowed
2287         * to fail if the other end is not acive.  In that case we don't
2288         * want to scan
2289         */
2290        if (ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0) == 0
2291            || rc == H_RESOURCE) {
2292                /*
2293                 * Wait around max init_timeout secs for the adapter to finish
2294                 * initializing. When we are done initializing, we will have a
2295                 * valid request_limit.  We don't want Linux scanning before
2296                 * we are ready.
2297                 */
2298                for (wait_switch = jiffies + (init_timeout * HZ);
2299                     time_before(jiffies, wait_switch) &&
2300                     atomic_read(&hostdata->request_limit) < 2;) {
2301
2302                        msleep(10);
2303                }
2304
2305                /* if we now have a valid request_limit, initiate a scan */
2306                if (atomic_read(&hostdata->request_limit) > 0)
2307                        scsi_scan_host(host);
2308        }
2309
2310        dev_set_drvdata(&vdev->dev, hostdata);
2311        return 0;
2312
2313      add_srp_port_failed:
2314        scsi_remove_host(hostdata->host);
2315      add_host_failed:
2316        release_event_pool(&hostdata->pool, hostdata);
2317      init_pool_failed:
2318        ibmvscsi_release_crq_queue(&hostdata->queue, hostdata, max_events);
2319      kill_kthread:
2320      kthread_stop(hostdata->work_thread);
2321      init_crq_failed:
2322        unmap_persist_bufs(hostdata);
2323      persist_bufs_failed:
2324        scsi_host_put(host);
2325      scsi_host_alloc_failed:
2326        return -1;
2327}
2328
2329static int ibmvscsi_remove(struct vio_dev *vdev)
2330{
2331        struct ibmvscsi_host_data *hostdata = dev_get_drvdata(&vdev->dev);
2332        unmap_persist_bufs(hostdata);
2333        release_event_pool(&hostdata->pool, hostdata);
2334        ibmvscsi_release_crq_queue(&hostdata->queue, hostdata,
2335                                        max_events);
2336
2337        kthread_stop(hostdata->work_thread);
2338        srp_remove_host(hostdata->host);
2339        scsi_remove_host(hostdata->host);
2340        scsi_host_put(hostdata->host);
2341
2342        return 0;
2343}
2344
2345/**
2346 * ibmvscsi_resume: Resume from suspend
2347 * @dev:        device struct
2348 *
2349 * We may have lost an interrupt across suspend/resume, so kick the
2350 * interrupt handler
2351 */
2352static int ibmvscsi_resume(struct device *dev)
2353{
2354        struct ibmvscsi_host_data *hostdata = dev_get_drvdata(dev);
2355        vio_disable_interrupts(to_vio_dev(hostdata->dev));
2356        tasklet_schedule(&hostdata->srp_task);
2357
2358        return 0;
2359}
2360
2361/**
2362 * ibmvscsi_device_table: Used by vio.c to match devices in the device tree we 
2363 * support.
2364 */
2365static struct vio_device_id ibmvscsi_device_table[] __devinitdata = {
2366        {"vscsi", "IBM,v-scsi"},
2367        { "", "" }
2368};
2369MODULE_DEVICE_TABLE(vio, ibmvscsi_device_table);
2370
2371static struct dev_pm_ops ibmvscsi_pm_ops = {
2372        .resume = ibmvscsi_resume
2373};
2374
2375static struct vio_driver ibmvscsi_driver = {
2376        .id_table = ibmvscsi_device_table,
2377        .probe = ibmvscsi_probe,
2378        .remove = ibmvscsi_remove,
2379        .get_desired_dma = ibmvscsi_get_desired_dma,
2380        .name = "ibmvscsi",
2381        .pm = &ibmvscsi_pm_ops,
2382};
2383
2384static struct srp_function_template ibmvscsi_transport_functions = {
2385};
2386
2387int __init ibmvscsi_module_init(void)
2388{
2389        int ret;
2390
2391        /* Ensure we have two requests to do error recovery */
2392        driver_template.can_queue = max_requests;
2393        max_events = max_requests + 2;
2394
2395        if (!firmware_has_feature(FW_FEATURE_VIO))
2396                return -ENODEV;
2397
2398        ibmvscsi_transport_template =
2399                srp_attach_transport(&ibmvscsi_transport_functions);
2400        if (!ibmvscsi_transport_template)
2401                return -ENOMEM;
2402
2403        ret = vio_register_driver(&ibmvscsi_driver);
2404        if (ret)
2405                srp_release_transport(ibmvscsi_transport_template);
2406        return ret;
2407}
2408
2409void __exit ibmvscsi_module_exit(void)
2410{
2411        vio_unregister_driver(&ibmvscsi_driver);
2412        srp_release_transport(ibmvscsi_transport_template);
2413}
2414
2415module_init(ibmvscsi_module_init);
2416module_exit(ibmvscsi_module_exit);
2417