Linux Audio

Check our new training course

Linux debugging, profiling, tracing and performance analysis training

Mar 24-27, 2025, special US time zones
Register
Loading...
v4.10.11
   1/* ------------------------------------------------------------
   2 * ibmvscsi.c
   3 * (C) Copyright IBM Corporation 1994, 2004
   4 * Authors: Colin DeVilbiss (devilbis@us.ibm.com)
   5 *          Santiago Leon (santil@us.ibm.com)
   6 *          Dave Boutcher (sleddog@us.ibm.com)
   7 *
   8 * This program is free software; you can redistribute it and/or modify
   9 * it under the terms of the GNU General Public License as published by
  10 * the Free Software Foundation; either version 2 of the License, or
  11 * (at your option) any later version.
  12 *
  13 * This program is distributed in the hope that it will be useful,
  14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  16 * GNU General Public License for more details.
  17 *
  18 * You should have received a copy of the GNU General Public License
  19 * along with this program; if not, write to the Free Software
  20 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307
  21 * USA
  22 *
  23 * ------------------------------------------------------------
  24 * Emulation of a SCSI host adapter for Virtual I/O devices
  25 *
  26 * This driver supports the SCSI adapter implemented by the IBM
  27 * Power5 firmware.  That SCSI adapter is not a physical adapter,
  28 * but allows Linux SCSI peripheral drivers to directly
  29 * access devices in another logical partition on the physical system.
  30 *
  31 * The virtual adapter(s) are present in the open firmware device
  32 * tree just like real adapters.
  33 *
  34 * One of the capabilities provided on these systems is the ability
  35 * to DMA between partitions.  The architecture states that for VSCSI,
  36 * the server side is allowed to DMA to and from the client.  The client
  37 * is never trusted to DMA to or from the server directly.
  38 *
  39 * Messages are sent between partitions on a "Command/Response Queue" 
   40 * (CRQ), which is just a buffer of 16 byte entries in the receiver's memory.
  41 * Senders cannot access the buffer directly, but send messages by
  42 * making a hypervisor call and passing in the 16 bytes.  The hypervisor
  43 * puts the message in the next 16 byte space in round-robin fashion,
  44 * turns on the high order bit of the message (the valid bit), and 
  45 * generates an interrupt to the receiver (if interrupts are turned on.) 
  46 * The receiver just turns off the valid bit when they have copied out
  47 * the message.
  48 *
  49 * The VSCSI client builds a SCSI Remote Protocol (SRP) Information Unit
  50 * (IU) (as defined in the T10 standard available at www.t10.org), gets 
  51 * a DMA address for the message, and sends it to the server as the
  52 * payload of a CRQ message.  The server DMAs the SRP IU and processes it,
  53 * including doing any additional data transfers.  When it is done, it
  54 * DMAs the SRP response back to the same address as the request came from,
  55 * and sends a CRQ message back to inform the client that the request has
  56 * completed.
  57 *
  58 * TODO: This is currently pretty tied to the IBM pSeries hypervisor
  59 * interfaces.  It would be really nice to abstract this above an RDMA
  60 * layer.
  61 */
  62
  63#include <linux/module.h>
  64#include <linux/moduleparam.h>
  65#include <linux/dma-mapping.h>
  66#include <linux/delay.h>
  67#include <linux/slab.h>
  68#include <linux/of.h>
  69#include <linux/pm.h>
  70#include <linux/kthread.h>
  71#include <asm/firmware.h>
  72#include <asm/vio.h>
  73#include <scsi/scsi.h>
  74#include <scsi/scsi_cmnd.h>
  75#include <scsi/scsi_host.h>
  76#include <scsi/scsi_device.h>
  77#include <scsi/scsi_transport_srp.h>
  78#include "ibmvscsi.h"
  79
  80/* The values below are somewhat arbitrary default values, but 
  81 * OS/400 will use 3 busses (disks, CDs, tapes, I think.)
  82 * Note that there are 3 bits of channel value, 6 bits of id, and
  83 * 5 bits of LUN.
  84 */
  85static int max_id = 64;
  86static int max_channel = 3;
  87static int init_timeout = 300;
  88static int login_timeout = 60;
  89static int info_timeout = 30;
  90static int abort_timeout = 60;
  91static int reset_timeout = 60;
  92static int max_requests = IBMVSCSI_MAX_REQUESTS_DEFAULT;
  93static int max_events = IBMVSCSI_MAX_REQUESTS_DEFAULT + 2;
  94static int fast_fail = 1;
  95static int client_reserve = 1;
  96static char partition_name[97] = "UNKNOWN";
  97static unsigned int partition_number = -1;
  98static LIST_HEAD(ibmvscsi_head);
  99
 100static struct scsi_transport_template *ibmvscsi_transport_template;
 101
 102#define IBMVSCSI_VERSION "1.5.9"
 103
 104MODULE_DESCRIPTION("IBM Virtual SCSI");
 105MODULE_AUTHOR("Dave Boutcher");
 106MODULE_LICENSE("GPL");
 107MODULE_VERSION(IBMVSCSI_VERSION);
 108
 109module_param_named(max_id, max_id, int, S_IRUGO | S_IWUSR);
 110MODULE_PARM_DESC(max_id, "Largest ID value for each channel [Default=64]");
 111module_param_named(max_channel, max_channel, int, S_IRUGO | S_IWUSR);
 112MODULE_PARM_DESC(max_channel, "Largest channel value [Default=3]");
 113module_param_named(init_timeout, init_timeout, int, S_IRUGO | S_IWUSR);
 114MODULE_PARM_DESC(init_timeout, "Initialization timeout in seconds");
 115module_param_named(max_requests, max_requests, int, S_IRUGO);
 116MODULE_PARM_DESC(max_requests, "Maximum requests for this adapter");
 117module_param_named(fast_fail, fast_fail, int, S_IRUGO | S_IWUSR);
 118MODULE_PARM_DESC(fast_fail, "Enable fast fail. [Default=1]");
 119module_param_named(client_reserve, client_reserve, int, S_IRUGO );
 120MODULE_PARM_DESC(client_reserve, "Attempt client managed reserve/release");
 121
 122static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
 123				struct ibmvscsi_host_data *hostdata);
 124
 125/* ------------------------------------------------------------
 126 * Routines for managing the command/response queue
 127 */
 128/**
 129 * ibmvscsi_handle_event: - Interrupt handler for crq events
 130 * @irq:	number of irq to handle, not used
 131 * @dev_instance: ibmvscsi_host_data of host that received interrupt
 132 *
 133 * Disables interrupts and schedules srp_task
 134 * Always returns IRQ_HANDLED
 135 */
 136static irqreturn_t ibmvscsi_handle_event(int irq, void *dev_instance)
 137{
 138	struct ibmvscsi_host_data *hostdata =
 139	    (struct ibmvscsi_host_data *)dev_instance;
 140	vio_disable_interrupts(to_vio_dev(hostdata->dev));
 141	tasklet_schedule(&hostdata->srp_task);
 142	return IRQ_HANDLED;
 143}
 144
 145/**
 146 * release_crq_queue: - Deallocates data and unregisters CRQ
 147 * @queue:	crq_queue to initialize and register
 148 * @host_data:	ibmvscsi_host_data of host
 149 *
 150 * Frees irq, deallocates a page for messages, unmaps dma, and unregisters
 151 * the crq with the hypervisor.
 152 */
 153static void ibmvscsi_release_crq_queue(struct crq_queue *queue,
 154				       struct ibmvscsi_host_data *hostdata,
 155				       int max_requests)
 156{
 157	long rc = 0;
 158	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 159	free_irq(vdev->irq, (void *)hostdata);
 160	tasklet_kill(&hostdata->srp_task);
 161	do {
 162		if (rc)
 163			msleep(100);
 164		rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 165	} while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 166	dma_unmap_single(hostdata->dev,
 167			 queue->msg_token,
 168			 queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
 169	free_page((unsigned long)queue->msgs);
 170}
 171
 172/**
 173 * crq_queue_next_crq: - Returns the next entry in message queue
 174 * @queue:	crq_queue to use
 175 *
 176 * Returns pointer to next entry in queue, or NULL if there are no new
 177 * entried in the CRQ.
 178 */
 179static struct viosrp_crq *crq_queue_next_crq(struct crq_queue *queue)
 180{
 181	struct viosrp_crq *crq;
 182	unsigned long flags;
 183
 184	spin_lock_irqsave(&queue->lock, flags);
 185	crq = &queue->msgs[queue->cur];
 186	if (crq->valid != VIOSRP_CRQ_FREE) {
 187		if (++queue->cur == queue->size)
 188			queue->cur = 0;
 189
 190		/* Ensure the read of the valid bit occurs before reading any
 191		 * other bits of the CRQ entry
 192		 */
 193		rmb();
 194	} else
 195		crq = NULL;
 196	spin_unlock_irqrestore(&queue->lock, flags);
 197
 198	return crq;
 199}
 200
 201/**
 202 * ibmvscsi_send_crq: - Send a CRQ
 203 * @hostdata:	the adapter
 204 * @word1:	the first 64 bits of the data
 205 * @word2:	the second 64 bits of the data
 206 */
 207static int ibmvscsi_send_crq(struct ibmvscsi_host_data *hostdata,
 208			     u64 word1, u64 word2)
 209{
 210	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 211
 212	/*
 213	 * Ensure the command buffer is flushed to memory before handing it
 214	 * over to the VIOS to prevent it from fetching any stale data.
 215	 */
 216	mb();
 217	return plpar_hcall_norets(H_SEND_CRQ, vdev->unit_address, word1, word2);
 218}
 219
 220/**
 221 * ibmvscsi_task: - Process srps asynchronously
 222 * @data:	ibmvscsi_host_data of host
 223 */
 224static void ibmvscsi_task(void *data)
 225{
 226	struct ibmvscsi_host_data *hostdata = (struct ibmvscsi_host_data *)data;
 227	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 228	struct viosrp_crq *crq;
 229	int done = 0;
 230
 231	while (!done) {
 232		/* Pull all the valid messages off the CRQ */
 233		while ((crq = crq_queue_next_crq(&hostdata->queue)) != NULL) {
 234			ibmvscsi_handle_crq(crq, hostdata);
 235			crq->valid = VIOSRP_CRQ_FREE;
 236			wmb();
 237		}
 238
 239		vio_enable_interrupts(vdev);
 240		crq = crq_queue_next_crq(&hostdata->queue);
 241		if (crq != NULL) {
 242			vio_disable_interrupts(vdev);
 243			ibmvscsi_handle_crq(crq, hostdata);
 244			crq->valid = VIOSRP_CRQ_FREE;
 245			wmb();
 246		} else {
 247			done = 1;
 248		}
 249	}
 250}
 251
 252static void gather_partition_info(void)
 253{
 254	const char *ppartition_name;
 255	const __be32 *p_number_ptr;
 256
 257	/* Retrieve information about this partition */
 258	if (!of_root)
 259		return;
 260
 261	of_node_get(of_root);
 262
 263	ppartition_name = of_get_property(of_root, "ibm,partition-name", NULL);
 264	if (ppartition_name)
 265		strncpy(partition_name, ppartition_name,
 266				sizeof(partition_name));
 267	p_number_ptr = of_get_property(of_root, "ibm,partition-no", NULL);
 268	if (p_number_ptr)
 269		partition_number = of_read_number(p_number_ptr, 1);
 270	of_node_put(of_root);
 271}
 272
 273static void set_adapter_info(struct ibmvscsi_host_data *hostdata)
 274{
 275	memset(&hostdata->madapter_info, 0x00,
 276			sizeof(hostdata->madapter_info));
 277
 278	dev_info(hostdata->dev, "SRP_VERSION: %s\n", SRP_VERSION);
 279	strcpy(hostdata->madapter_info.srp_version, SRP_VERSION);
 280
 281	strncpy(hostdata->madapter_info.partition_name, partition_name,
 282			sizeof(hostdata->madapter_info.partition_name));
 283
 284	hostdata->madapter_info.partition_number =
 285					cpu_to_be32(partition_number);
 286
 287	hostdata->madapter_info.mad_version = cpu_to_be32(SRP_MAD_VERSION_1);
 288	hostdata->madapter_info.os_type = cpu_to_be32(SRP_MAD_OS_LINUX);
 289}
 290
 291/**
 292 * reset_crq_queue: - resets a crq after a failure
 293 * @queue:	crq_queue to initialize and register
 294 * @hostdata:	ibmvscsi_host_data of host
 295 *
 296 */
 297static int ibmvscsi_reset_crq_queue(struct crq_queue *queue,
 298				    struct ibmvscsi_host_data *hostdata)
 299{
 300	int rc = 0;
 301	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 302
 303	/* Close the CRQ */
 304	do {
 305		if (rc)
 306			msleep(100);
 307		rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 308	} while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 309
 310	/* Clean out the queue */
 311	memset(queue->msgs, 0x00, PAGE_SIZE);
 312	queue->cur = 0;
 313
 314	set_adapter_info(hostdata);
 315
 316	/* And re-open it again */
 317	rc = plpar_hcall_norets(H_REG_CRQ,
 318				vdev->unit_address,
 319				queue->msg_token, PAGE_SIZE);
 320	if (rc == H_CLOSED) {
 321		/* Adapter is good, but other end is not ready */
 322		dev_warn(hostdata->dev, "Partner adapter not ready\n");
 323	} else if (rc != 0) {
 324		dev_warn(hostdata->dev, "couldn't register crq--rc 0x%x\n", rc);
 325	}
 326	return rc;
 327}
 328
 329/**
 330 * initialize_crq_queue: - Initializes and registers CRQ with hypervisor
 331 * @queue:	crq_queue to initialize and register
 332 * @hostdata:	ibmvscsi_host_data of host
 333 *
 334 * Allocates a page for messages, maps it for dma, and registers
 335 * the crq with the hypervisor.
 336 * Returns zero on success.
 337 */
 338static int ibmvscsi_init_crq_queue(struct crq_queue *queue,
 339				   struct ibmvscsi_host_data *hostdata,
 340				   int max_requests)
 341{
 342	int rc;
 343	int retrc;
 344	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 345
 346	queue->msgs = (struct viosrp_crq *)get_zeroed_page(GFP_KERNEL);
 347
 348	if (!queue->msgs)
 349		goto malloc_failed;
 350	queue->size = PAGE_SIZE / sizeof(*queue->msgs);
 351
 352	queue->msg_token = dma_map_single(hostdata->dev, queue->msgs,
 353					  queue->size * sizeof(*queue->msgs),
 354					  DMA_BIDIRECTIONAL);
 355
 356	if (dma_mapping_error(hostdata->dev, queue->msg_token))
 357		goto map_failed;
 358
 359	gather_partition_info();
 360	set_adapter_info(hostdata);
 361
 362	retrc = rc = plpar_hcall_norets(H_REG_CRQ,
 363				vdev->unit_address,
 364				queue->msg_token, PAGE_SIZE);
 365	if (rc == H_RESOURCE)
 366		/* maybe kexecing and resource is busy. try a reset */
 367		rc = ibmvscsi_reset_crq_queue(queue,
 368					      hostdata);
 369
 370	if (rc == H_CLOSED) {
 371		/* Adapter is good, but other end is not ready */
 372		dev_warn(hostdata->dev, "Partner adapter not ready\n");
 373		retrc = 0;
 374	} else if (rc != 0) {
 375		dev_warn(hostdata->dev, "Error %d opening adapter\n", rc);
 376		goto reg_crq_failed;
 377	}
 378
 379	queue->cur = 0;
 380	spin_lock_init(&queue->lock);
 381
 382	tasklet_init(&hostdata->srp_task, (void *)ibmvscsi_task,
 383		     (unsigned long)hostdata);
 384
 385	if (request_irq(vdev->irq,
 386			ibmvscsi_handle_event,
 387			0, "ibmvscsi", (void *)hostdata) != 0) {
 388		dev_err(hostdata->dev, "couldn't register irq 0x%x\n",
 389			vdev->irq);
 390		goto req_irq_failed;
 391	}
 392
 393	rc = vio_enable_interrupts(vdev);
 394	if (rc != 0) {
 395		dev_err(hostdata->dev, "Error %d enabling interrupts!!!\n", rc);
 396		goto req_irq_failed;
 397	}
 398
 399	return retrc;
 400
 401      req_irq_failed:
 402	tasklet_kill(&hostdata->srp_task);
 403	rc = 0;
 404	do {
 405		if (rc)
 406			msleep(100);
 407		rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 408	} while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 409      reg_crq_failed:
 410	dma_unmap_single(hostdata->dev,
 411			 queue->msg_token,
 412			 queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
 413      map_failed:
 414	free_page((unsigned long)queue->msgs);
 415      malloc_failed:
 416	return -1;
 417}
 418
 419/**
 420 * reenable_crq_queue: - reenables a crq after
 421 * @queue:	crq_queue to initialize and register
 422 * @hostdata:	ibmvscsi_host_data of host
 423 *
 424 */
 425static int ibmvscsi_reenable_crq_queue(struct crq_queue *queue,
 426				       struct ibmvscsi_host_data *hostdata)
 427{
 428	int rc = 0;
 429	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 430
 431	/* Re-enable the CRQ */
 432	do {
 433		if (rc)
 434			msleep(100);
 435		rc = plpar_hcall_norets(H_ENABLE_CRQ, vdev->unit_address);
 436	} while ((rc == H_IN_PROGRESS) || (rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 437
 438	if (rc)
 439		dev_err(hostdata->dev, "Error %d enabling adapter\n", rc);
 440	return rc;
 441}
 442
 443/* ------------------------------------------------------------
 444 * Routines for the event pool and event structs
 445 */
 446/**
 447 * initialize_event_pool: - Allocates and initializes the event pool for a host
 448 * @pool:	event_pool to be initialized
 449 * @size:	Number of events in pool
 450 * @hostdata:	ibmvscsi_host_data who owns the event pool
 451 *
 452 * Returns zero on success.
 453*/
 454static int initialize_event_pool(struct event_pool *pool,
 455				 int size, struct ibmvscsi_host_data *hostdata)
 456{
 457	int i;
 458
 459	pool->size = size;
 460	pool->next = 0;
 461	pool->events = kcalloc(pool->size, sizeof(*pool->events), GFP_KERNEL);
 462	if (!pool->events)
 463		return -ENOMEM;
 464
 465	pool->iu_storage =
 466	    dma_alloc_coherent(hostdata->dev,
 467			       pool->size * sizeof(*pool->iu_storage),
 468			       &pool->iu_token, 0);
 469	if (!pool->iu_storage) {
 470		kfree(pool->events);
 471		return -ENOMEM;
 472	}
 473
 474	for (i = 0; i < pool->size; ++i) {
 475		struct srp_event_struct *evt = &pool->events[i];
 476		memset(&evt->crq, 0x00, sizeof(evt->crq));
 477		atomic_set(&evt->free, 1);
 478		evt->crq.valid = VIOSRP_CRQ_CMD_RSP;
 479		evt->crq.IU_length = cpu_to_be16(sizeof(*evt->xfer_iu));
 480		evt->crq.IU_data_ptr = cpu_to_be64(pool->iu_token +
 481			sizeof(*evt->xfer_iu) * i);
 482		evt->xfer_iu = pool->iu_storage + i;
 483		evt->hostdata = hostdata;
 484		evt->ext_list = NULL;
 485		evt->ext_list_token = 0;
 486	}
 487
 488	return 0;
 489}
 490
 491/**
 492 * release_event_pool: - Frees memory of an event pool of a host
 493 * @pool:	event_pool to be released
 494 * @hostdata:	ibmvscsi_host_data who owns the even pool
 495 *
 496 * Returns zero on success.
 497*/
 498static void release_event_pool(struct event_pool *pool,
 499			       struct ibmvscsi_host_data *hostdata)
 500{
 501	int i, in_use = 0;
 502	for (i = 0; i < pool->size; ++i) {
 503		if (atomic_read(&pool->events[i].free) != 1)
 504			++in_use;
 505		if (pool->events[i].ext_list) {
 506			dma_free_coherent(hostdata->dev,
 507				  SG_ALL * sizeof(struct srp_direct_buf),
 508				  pool->events[i].ext_list,
 509				  pool->events[i].ext_list_token);
 510		}
 511	}
 512	if (in_use)
 513		dev_warn(hostdata->dev, "releasing event pool with %d "
 514			 "events still in use?\n", in_use);
 515	kfree(pool->events);
 516	dma_free_coherent(hostdata->dev,
 517			  pool->size * sizeof(*pool->iu_storage),
 518			  pool->iu_storage, pool->iu_token);
 519}
 520
 521/**
 522 * valid_event_struct: - Determines if event is valid.
 523 * @pool:	event_pool that contains the event
 524 * @evt:	srp_event_struct to be checked for validity
 525 *
 526 * Returns zero if event is invalid, one otherwise.
 527*/
 528static int valid_event_struct(struct event_pool *pool,
 529				struct srp_event_struct *evt)
 530{
 531	int index = evt - pool->events;
 532	if (index < 0 || index >= pool->size)	/* outside of bounds */
 533		return 0;
 534	if (evt != pool->events + index)	/* unaligned */
 535		return 0;
 536	return 1;
 537}
 538
 539/**
 540 * ibmvscsi_free-event_struct: - Changes status of event to "free"
 541 * @pool:	event_pool that contains the event
 542 * @evt:	srp_event_struct to be modified
 543 *
 544*/
 545static void free_event_struct(struct event_pool *pool,
 546				       struct srp_event_struct *evt)
 547{
 548	if (!valid_event_struct(pool, evt)) {
 549		dev_err(evt->hostdata->dev, "Freeing invalid event_struct %p "
 550			"(not in pool %p)\n", evt, pool->events);
 551		return;
 552	}
 553	if (atomic_inc_return(&evt->free) != 1) {
 554		dev_err(evt->hostdata->dev, "Freeing event_struct %p "
 555			"which is not in use!\n", evt);
 556		return;
 557	}
 558}
 559
 560/**
 561 * get_evt_struct: - Gets the next free event in pool
 562 * @pool:	event_pool that contains the events to be searched
 563 *
 564 * Returns the next event in "free" state, and NULL if none are free.
 565 * Note that no synchronization is done here, we assume the host_lock
 566 * will syncrhonze things.
 567*/
 568static struct srp_event_struct *get_event_struct(struct event_pool *pool)
 569{
 570	int i;
 571	int poolsize = pool->size;
 572	int offset = pool->next;
 573
 574	for (i = 0; i < poolsize; i++) {
 575		offset = (offset + 1) % poolsize;
 576		if (!atomic_dec_if_positive(&pool->events[offset].free)) {
 577			pool->next = offset;
 578			return &pool->events[offset];
 579		}
 580	}
 581
 582	printk(KERN_ERR "ibmvscsi: found no event struct in pool!\n");
 583	return NULL;
 584}
 585
 586/**
 587 * init_event_struct: Initialize fields in an event struct that are always 
 588 *                    required.
 589 * @evt:        The event
 590 * @done:       Routine to call when the event is responded to
 591 * @format:     SRP or MAD format
 592 * @timeout:    timeout value set in the CRQ
 593 */
 594static void init_event_struct(struct srp_event_struct *evt_struct,
 595			      void (*done) (struct srp_event_struct *),
 596			      u8 format,
 597			      int timeout)
 598{
 599	evt_struct->cmnd = NULL;
 600	evt_struct->cmnd_done = NULL;
 601	evt_struct->sync_srp = NULL;
 602	evt_struct->crq.format = format;
 603	evt_struct->crq.timeout = cpu_to_be16(timeout);
 604	evt_struct->done = done;
 605}
 606
 607/* ------------------------------------------------------------
 608 * Routines for receiving SCSI responses from the hosting partition
 609 */
 610
 611/**
 612 * set_srp_direction: Set the fields in the srp related to data
 613 *     direction and number of buffers based on the direction in
 614 *     the scsi_cmnd and the number of buffers
 615 */
 616static void set_srp_direction(struct scsi_cmnd *cmd,
 617			      struct srp_cmd *srp_cmd, 
 618			      int numbuf)
 619{
 620	u8 fmt;
 621
 622	if (numbuf == 0)
 623		return;
 624	
 625	if (numbuf == 1)
 626		fmt = SRP_DATA_DESC_DIRECT;
 627	else {
 628		fmt = SRP_DATA_DESC_INDIRECT;
 629		numbuf = min(numbuf, MAX_INDIRECT_BUFS);
 630
 631		if (cmd->sc_data_direction == DMA_TO_DEVICE)
 632			srp_cmd->data_out_desc_cnt = numbuf;
 633		else
 634			srp_cmd->data_in_desc_cnt = numbuf;
 635	}
 636
 637	if (cmd->sc_data_direction == DMA_TO_DEVICE)
 638		srp_cmd->buf_fmt = fmt << 4;
 639	else
 640		srp_cmd->buf_fmt = fmt;
 641}
 642
 643/**
 644 * unmap_cmd_data: - Unmap data pointed in srp_cmd based on the format
 645 * @cmd:	srp_cmd whose additional_data member will be unmapped
 646 * @dev:	device for which the memory is mapped
 647 *
 648*/
 649static void unmap_cmd_data(struct srp_cmd *cmd,
 650			   struct srp_event_struct *evt_struct,
 651			   struct device *dev)
 652{
 653	u8 out_fmt, in_fmt;
 654
 655	out_fmt = cmd->buf_fmt >> 4;
 656	in_fmt = cmd->buf_fmt & ((1U << 4) - 1);
 657
 658	if (out_fmt == SRP_NO_DATA_DESC && in_fmt == SRP_NO_DATA_DESC)
 659		return;
 660
 661	if (evt_struct->cmnd)
 662		scsi_dma_unmap(evt_struct->cmnd);
 663}
 664
 665static int map_sg_list(struct scsi_cmnd *cmd, int nseg,
 666		       struct srp_direct_buf *md)
 667{
 668	int i;
 669	struct scatterlist *sg;
 670	u64 total_length = 0;
 671
 672	scsi_for_each_sg(cmd, sg, nseg, i) {
 673		struct srp_direct_buf *descr = md + i;
 674		descr->va = cpu_to_be64(sg_dma_address(sg));
 675		descr->len = cpu_to_be32(sg_dma_len(sg));
 676		descr->key = 0;
 677		total_length += sg_dma_len(sg);
 678 	}
 679	return total_length;
 680}
 681
 682/**
 683 * map_sg_data: - Maps dma for a scatterlist and initializes decriptor fields
 684 * @cmd:	Scsi_Cmnd with the scatterlist
 685 * @srp_cmd:	srp_cmd that contains the memory descriptor
 686 * @dev:	device for which to map dma memory
 687 *
 688 * Called by map_data_for_srp_cmd() when building srp cmd from scsi cmd.
 689 * Returns 1 on success.
 690*/
 691static int map_sg_data(struct scsi_cmnd *cmd,
 692		       struct srp_event_struct *evt_struct,
 693		       struct srp_cmd *srp_cmd, struct device *dev)
 694{
 695
 696	int sg_mapped;
 697	u64 total_length = 0;
 698	struct srp_direct_buf *data =
 699		(struct srp_direct_buf *) srp_cmd->add_data;
 700	struct srp_indirect_buf *indirect =
 701		(struct srp_indirect_buf *) data;
 702
 703	sg_mapped = scsi_dma_map(cmd);
 704	if (!sg_mapped)
 705		return 1;
 706	else if (sg_mapped < 0)
 707		return 0;
 708
 709	set_srp_direction(cmd, srp_cmd, sg_mapped);
 710
 711	/* special case; we can use a single direct descriptor */
 712	if (sg_mapped == 1) {
 713		map_sg_list(cmd, sg_mapped, data);
 714		return 1;
 715	}
 716
 717	indirect->table_desc.va = 0;
 718	indirect->table_desc.len = cpu_to_be32(sg_mapped *
 719					       sizeof(struct srp_direct_buf));
 720	indirect->table_desc.key = 0;
 721
 722	if (sg_mapped <= MAX_INDIRECT_BUFS) {
 723		total_length = map_sg_list(cmd, sg_mapped,
 724					   &indirect->desc_list[0]);
 725		indirect->len = cpu_to_be32(total_length);
 726		return 1;
 727	}
 728
 729	/* get indirect table */
 730	if (!evt_struct->ext_list) {
 731		evt_struct->ext_list = (struct srp_direct_buf *)
 732			dma_alloc_coherent(dev,
 733					   SG_ALL * sizeof(struct srp_direct_buf),
 734					   &evt_struct->ext_list_token, 0);
 735		if (!evt_struct->ext_list) {
 736			if (!firmware_has_feature(FW_FEATURE_CMO))
 737				sdev_printk(KERN_ERR, cmd->device,
 738				            "Can't allocate memory "
 739				            "for indirect table\n");
 740			scsi_dma_unmap(cmd);
 741			return 0;
 742		}
 743	}
 744
 745	total_length = map_sg_list(cmd, sg_mapped, evt_struct->ext_list);
 746
 747	indirect->len = cpu_to_be32(total_length);
 748	indirect->table_desc.va = cpu_to_be64(evt_struct->ext_list_token);
 749	indirect->table_desc.len = cpu_to_be32(sg_mapped *
 750					       sizeof(indirect->desc_list[0]));
 751	memcpy(indirect->desc_list, evt_struct->ext_list,
 752	       MAX_INDIRECT_BUFS * sizeof(struct srp_direct_buf));
 753 	return 1;
 754}
 755
 756/**
 757 * map_data_for_srp_cmd: - Calls functions to map data for srp cmds
 758 * @cmd:	struct scsi_cmnd with the memory to be mapped
 759 * @srp_cmd:	srp_cmd that contains the memory descriptor
 760 * @dev:	dma device for which to map dma memory
 761 *
 762 * Called by scsi_cmd_to_srp_cmd() when converting scsi cmds to srp cmds 
 763 * Returns 1 on success.
 764*/
 765static int map_data_for_srp_cmd(struct scsi_cmnd *cmd,
 766				struct srp_event_struct *evt_struct,
 767				struct srp_cmd *srp_cmd, struct device *dev)
 768{
 769	switch (cmd->sc_data_direction) {
 770	case DMA_FROM_DEVICE:
 771	case DMA_TO_DEVICE:
 772		break;
 773	case DMA_NONE:
 774		return 1;
 775	case DMA_BIDIRECTIONAL:
 776		sdev_printk(KERN_ERR, cmd->device,
 777			    "Can't map DMA_BIDIRECTIONAL to read/write\n");
 778		return 0;
 779	default:
 780		sdev_printk(KERN_ERR, cmd->device,
 781			    "Unknown data direction 0x%02x; can't map!\n",
 782			    cmd->sc_data_direction);
 783		return 0;
 784	}
 785
 786	return map_sg_data(cmd, evt_struct, srp_cmd, dev);
 787}
 788
 789/**
 790 * purge_requests: Our virtual adapter just shut down.  purge any sent requests
 791 * @hostdata:    the adapter
 792 */
 793static void purge_requests(struct ibmvscsi_host_data *hostdata, int error_code)
 794{
 795	struct srp_event_struct *evt;
 796	unsigned long flags;
 797
 798	spin_lock_irqsave(hostdata->host->host_lock, flags);
 799	while (!list_empty(&hostdata->sent)) {
 800		evt = list_first_entry(&hostdata->sent, struct srp_event_struct, list);
 801		list_del(&evt->list);
 802		del_timer(&evt->timer);
 803
 804		spin_unlock_irqrestore(hostdata->host->host_lock, flags);
 805		if (evt->cmnd) {
 806			evt->cmnd->result = (error_code << 16);
 807			unmap_cmd_data(&evt->iu.srp.cmd, evt,
 808				       evt->hostdata->dev);
 809			if (evt->cmnd_done)
 810				evt->cmnd_done(evt->cmnd);
 811		} else if (evt->done && evt->crq.format != VIOSRP_MAD_FORMAT &&
 812			   evt->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
 813			evt->done(evt);
 814		free_event_struct(&evt->hostdata->pool, evt);
 815		spin_lock_irqsave(hostdata->host->host_lock, flags);
 816	}
 817	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
 818}
 819
 820/**
 821 * ibmvscsi_reset_host - Reset the connection to the server
 822 * @hostdata:	struct ibmvscsi_host_data to reset
 823*/
 824static void ibmvscsi_reset_host(struct ibmvscsi_host_data *hostdata)
 825{
 826	scsi_block_requests(hostdata->host);
 827	atomic_set(&hostdata->request_limit, 0);
 828
 829	purge_requests(hostdata, DID_ERROR);
 830	hostdata->reset_crq = 1;
 831	wake_up(&hostdata->work_wait_q);
 832}
 833
 834/**
 835 * ibmvscsi_timeout - Internal command timeout handler
 836 * @evt_struct:	struct srp_event_struct that timed out
 837 *
 838 * Called when an internally generated command times out
 839*/
 840static void ibmvscsi_timeout(struct srp_event_struct *evt_struct)
 841{
 
 842	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
 843
 844	dev_err(hostdata->dev, "Command timed out (%x). Resetting connection\n",
 845		evt_struct->iu.srp.cmd.opcode);
 846
 847	ibmvscsi_reset_host(hostdata);
 848}
 849
 850
 851/* ------------------------------------------------------------
 852 * Routines for sending and receiving SRPs
 853 */
 854/**
 855 * ibmvscsi_send_srp_event: - Transforms event to u64 array and calls send_crq()
 856 * @evt_struct:	evt_struct to be sent
 857 * @hostdata:	ibmvscsi_host_data of host
 858 * @timeout:	timeout in seconds - 0 means do not time command
 859 *
 860 * Returns the value returned from ibmvscsi_send_crq(). (Zero for success)
 861 * Note that this routine assumes that host_lock is held for synchronization
 862*/
 863static int ibmvscsi_send_srp_event(struct srp_event_struct *evt_struct,
 864				   struct ibmvscsi_host_data *hostdata,
 865				   unsigned long timeout)
 866{
 867	__be64 *crq_as_u64 = (__be64 *)&evt_struct->crq;
 868	int request_status = 0;
 869	int rc;
 870	int srp_req = 0;
 871
 872	/* If we have exhausted our request limit, just fail this request,
 873	 * unless it is for a reset or abort.
 874	 * Note that there are rare cases involving driver generated requests 
 875	 * (such as task management requests) that the mid layer may think we
 876	 * can handle more requests (can_queue) when we actually can't
 877	 */
 878	if (evt_struct->crq.format == VIOSRP_SRP_FORMAT) {
 879		srp_req = 1;
 880		request_status =
 881			atomic_dec_if_positive(&hostdata->request_limit);
 882		/* If request limit was -1 when we started, it is now even
 883		 * less than that
 884		 */
 885		if (request_status < -1)
 886			goto send_error;
 887		/* Otherwise, we may have run out of requests. */
 888		/* If request limit was 0 when we started the adapter is in the
 889		 * process of performing a login with the server adapter, or
 890		 * we may have run out of requests.
 891		 */
 892		else if (request_status == -1 &&
 893		         evt_struct->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
 894			goto send_busy;
 895		/* Abort and reset calls should make it through.
 896		 * Nothing except abort and reset should use the last two
 897		 * slots unless we had two or less to begin with.
 898		 */
 899		else if (request_status < 2 &&
 900		         evt_struct->iu.srp.cmd.opcode != SRP_TSK_MGMT) {
 901			/* In the case that we have less than two requests
 902			 * available, check the server limit as a combination
 903			 * of the request limit and the number of requests
 904			 * in-flight (the size of the send list).  If the
 905			 * server limit is greater than 2, return busy so
 906			 * that the last two are reserved for reset and abort.
 907			 */
 908			int server_limit = request_status;
 909			struct srp_event_struct *tmp_evt;
 910
 911			list_for_each_entry(tmp_evt, &hostdata->sent, list) {
 912				server_limit++;
 913			}
 914
 915			if (server_limit > 2)
 916				goto send_busy;
 917		}
 918	}
 919
 920	/* Copy the IU into the transfer area */
 921	*evt_struct->xfer_iu = evt_struct->iu;
 922	evt_struct->xfer_iu->srp.rsp.tag = (u64)evt_struct;
 923
 924	/* Add this to the sent list.  We need to do this 
 925	 * before we actually send 
 926	 * in case it comes back REALLY fast
 927	 */
 928	list_add_tail(&evt_struct->list, &hostdata->sent);
 929
 930	init_timer(&evt_struct->timer);
 931	if (timeout) {
 932		evt_struct->timer.data = (unsigned long) evt_struct;
 933		evt_struct->timer.expires = jiffies + (timeout * HZ);
 934		evt_struct->timer.function = (void (*)(unsigned long))ibmvscsi_timeout;
 935		add_timer(&evt_struct->timer);
 936	}
 937
 938	rc = ibmvscsi_send_crq(hostdata, be64_to_cpu(crq_as_u64[0]),
 939			       be64_to_cpu(crq_as_u64[1]));
 940	if (rc != 0) {
 941		list_del(&evt_struct->list);
 942		del_timer(&evt_struct->timer);
 943
 944		/* If send_crq returns H_CLOSED, return SCSI_MLQUEUE_HOST_BUSY.
 945		 * Firmware will send a CRQ with a transport event (0xFF) to
 946		 * tell this client what has happened to the transport.  This
 947		 * will be handled in ibmvscsi_handle_crq()
 948		 */
 949		if (rc == H_CLOSED) {
 950			dev_warn(hostdata->dev, "send warning. "
 951			         "Receive queue closed, will retry.\n");
 952			goto send_busy;
 953		}
 954		dev_err(hostdata->dev, "send error %d\n", rc);
 955		if (srp_req)
 956			atomic_inc(&hostdata->request_limit);
 957		goto send_error;
 958	}
 959
 960	return 0;
 961
 962 send_busy:
 963	unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
 964
 965	free_event_struct(&hostdata->pool, evt_struct);
 966	if (srp_req && request_status != -1)
 967		atomic_inc(&hostdata->request_limit);
 968	return SCSI_MLQUEUE_HOST_BUSY;
 969
 970 send_error:
 971	unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
 972
 973	if (evt_struct->cmnd != NULL) {
 974		evt_struct->cmnd->result = DID_ERROR << 16;
 975		evt_struct->cmnd_done(evt_struct->cmnd);
 976	} else if (evt_struct->done)
 977		evt_struct->done(evt_struct);
 978
 979	free_event_struct(&hostdata->pool, evt_struct);
 980	return 0;
 981}
 982
 983/**
 984 * handle_cmd_rsp: -  Handle responses from commands
 985 * @evt_struct:	srp_event_struct to be handled
 986 *
 987 * Used as a callback by when sending scsi cmds.
 988 * Gets called by ibmvscsi_handle_crq()
 989*/
 990static void handle_cmd_rsp(struct srp_event_struct *evt_struct)
 991{
 992	struct srp_rsp *rsp = &evt_struct->xfer_iu->srp.rsp;
 993	struct scsi_cmnd *cmnd = evt_struct->cmnd;
 994
 995	if (unlikely(rsp->opcode != SRP_RSP)) {
 996		if (printk_ratelimit())
 997			dev_warn(evt_struct->hostdata->dev,
 998				 "bad SRP RSP type %#02x\n", rsp->opcode);
 999	}
1000	
1001	if (cmnd) {
1002		cmnd->result |= rsp->status;
1003		if (((cmnd->result >> 1) & 0x1f) == CHECK_CONDITION)
1004			memcpy(cmnd->sense_buffer,
1005			       rsp->data,
1006			       be32_to_cpu(rsp->sense_data_len));
1007		unmap_cmd_data(&evt_struct->iu.srp.cmd, 
1008			       evt_struct, 
1009			       evt_struct->hostdata->dev);
1010
1011		if (rsp->flags & SRP_RSP_FLAG_DOOVER)
1012			scsi_set_resid(cmnd,
1013				       be32_to_cpu(rsp->data_out_res_cnt));
1014		else if (rsp->flags & SRP_RSP_FLAG_DIOVER)
1015			scsi_set_resid(cmnd, be32_to_cpu(rsp->data_in_res_cnt));
1016	}
1017
1018	if (evt_struct->cmnd_done)
1019		evt_struct->cmnd_done(cmnd);
1020}
1021
1022/**
1023 * lun_from_dev: - Returns the lun of the scsi device
1024 * @dev:	struct scsi_device
1025 *
1026*/
1027static inline u16 lun_from_dev(struct scsi_device *dev)
1028{
1029	return (0x2 << 14) | (dev->id << 8) | (dev->channel << 5) | dev->lun;
1030}
1031
1032/**
1033 * ibmvscsi_queue: - The queuecommand function of the scsi template 
1034 * @cmd:	struct scsi_cmnd to be executed
1035 * @done:	Callback function to be called when cmd is completed
1036*/
1037static int ibmvscsi_queuecommand_lck(struct scsi_cmnd *cmnd,
1038				 void (*done) (struct scsi_cmnd *))
1039{
1040	struct srp_cmd *srp_cmd;
1041	struct srp_event_struct *evt_struct;
1042	struct srp_indirect_buf *indirect;
1043	struct ibmvscsi_host_data *hostdata = shost_priv(cmnd->device->host);
1044	u16 lun = lun_from_dev(cmnd->device);
1045	u8 out_fmt, in_fmt;
1046
1047	cmnd->result = (DID_OK << 16);
1048	evt_struct = get_event_struct(&hostdata->pool);
1049	if (!evt_struct)
1050		return SCSI_MLQUEUE_HOST_BUSY;
1051
1052	/* Set up the actual SRP IU */
1053	srp_cmd = &evt_struct->iu.srp.cmd;
1054	memset(srp_cmd, 0x00, SRP_MAX_IU_LEN);
1055	srp_cmd->opcode = SRP_CMD;
1056	memcpy(srp_cmd->cdb, cmnd->cmnd, sizeof(srp_cmd->cdb));
1057	int_to_scsilun(lun, &srp_cmd->lun);
1058
1059	if (!map_data_for_srp_cmd(cmnd, evt_struct, srp_cmd, hostdata->dev)) {
1060		if (!firmware_has_feature(FW_FEATURE_CMO))
1061			sdev_printk(KERN_ERR, cmnd->device,
1062			            "couldn't convert cmd to srp_cmd\n");
1063		free_event_struct(&hostdata->pool, evt_struct);
1064		return SCSI_MLQUEUE_HOST_BUSY;
1065	}
1066
1067	init_event_struct(evt_struct,
1068			  handle_cmd_rsp,
1069			  VIOSRP_SRP_FORMAT,
1070			  cmnd->request->timeout/HZ);
1071
1072	evt_struct->cmnd = cmnd;
1073	evt_struct->cmnd_done = done;
1074
1075	/* Fix up dma address of the buffer itself */
1076	indirect = (struct srp_indirect_buf *) srp_cmd->add_data;
1077	out_fmt = srp_cmd->buf_fmt >> 4;
1078	in_fmt = srp_cmd->buf_fmt & ((1U << 4) - 1);
1079	if ((in_fmt == SRP_DATA_DESC_INDIRECT ||
1080	     out_fmt == SRP_DATA_DESC_INDIRECT) &&
1081	    indirect->table_desc.va == 0) {
1082		indirect->table_desc.va =
1083			cpu_to_be64(be64_to_cpu(evt_struct->crq.IU_data_ptr) +
1084			offsetof(struct srp_cmd, add_data) +
1085			offsetof(struct srp_indirect_buf, desc_list));
1086	}
1087
1088	return ibmvscsi_send_srp_event(evt_struct, hostdata, 0);
1089}
1090
1091static DEF_SCSI_QCMD(ibmvscsi_queuecommand)
1092
1093/* ------------------------------------------------------------
1094 * Routines for driver initialization
1095 */
1096
1097/**
1098 * map_persist_bufs: - Pre-map persistent data for adapter logins
1099 * @hostdata:   ibmvscsi_host_data of host
1100 *
1101 * Map the capabilities and adapter info DMA buffers to avoid runtime failures.
1102 * Return 1 on error, 0 on success.
1103 */
1104static int map_persist_bufs(struct ibmvscsi_host_data *hostdata)
1105{
1106
1107	hostdata->caps_addr = dma_map_single(hostdata->dev, &hostdata->caps,
1108					     sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1109
1110	if (dma_mapping_error(hostdata->dev, hostdata->caps_addr)) {
1111		dev_err(hostdata->dev, "Unable to map capabilities buffer!\n");
1112		return 1;
1113	}
1114
1115	hostdata->adapter_info_addr = dma_map_single(hostdata->dev,
1116						     &hostdata->madapter_info,
1117						     sizeof(hostdata->madapter_info),
1118						     DMA_BIDIRECTIONAL);
1119	if (dma_mapping_error(hostdata->dev, hostdata->adapter_info_addr)) {
1120		dev_err(hostdata->dev, "Unable to map adapter info buffer!\n");
1121		dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1122				 sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1123		return 1;
1124	}
1125
1126	return 0;
1127}
1128
1129/**
1130 * unmap_persist_bufs: - Unmap persistent data needed for adapter logins
1131 * @hostdata:   ibmvscsi_host_data of host
1132 *
1133 * Unmap the capabilities and adapter info DMA buffers
1134 */
1135static void unmap_persist_bufs(struct ibmvscsi_host_data *hostdata)
1136{
1137	dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1138			 sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1139
1140	dma_unmap_single(hostdata->dev, hostdata->adapter_info_addr,
1141			 sizeof(hostdata->madapter_info), DMA_BIDIRECTIONAL);
1142}
1143
1144/**
1145 * login_rsp: - Handle response to SRP login request
1146 * @evt_struct:	srp_event_struct with the response
1147 *
1148 * Used as a "done" callback by when sending srp_login. Gets called
1149 * by ibmvscsi_handle_crq()
1150*/
1151static void login_rsp(struct srp_event_struct *evt_struct)
1152{
1153	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1154	switch (evt_struct->xfer_iu->srp.login_rsp.opcode) {
1155	case SRP_LOGIN_RSP:	/* it worked! */
1156		break;
1157	case SRP_LOGIN_REJ:	/* refused! */
1158		dev_info(hostdata->dev, "SRP_LOGIN_REJ reason %u\n",
1159			 evt_struct->xfer_iu->srp.login_rej.reason);
1160		/* Login failed.  */
1161		atomic_set(&hostdata->request_limit, -1);
1162		return;
1163	default:
1164		dev_err(hostdata->dev, "Invalid login response typecode 0x%02x!\n",
1165			evt_struct->xfer_iu->srp.login_rsp.opcode);
1166		/* Login failed.  */
1167		atomic_set(&hostdata->request_limit, -1);
1168		return;
1169	}
1170
1171	dev_info(hostdata->dev, "SRP_LOGIN succeeded\n");
1172	hostdata->client_migrated = 0;
1173
1174	/* Now we know what the real request-limit is.
1175	 * This value is set rather than added to request_limit because
1176	 * request_limit could have been set to -1 by this client.
1177	 */
1178	atomic_set(&hostdata->request_limit,
1179		   be32_to_cpu(evt_struct->xfer_iu->srp.login_rsp.req_lim_delta));
1180
1181	/* If we had any pending I/Os, kick them */
1182	scsi_unblock_requests(hostdata->host);
1183}
1184
1185/**
1186 * send_srp_login: - Sends the srp login
1187 * @hostdata:	ibmvscsi_host_data of host
1188 *
1189 * Returns zero if successful.
1190*/
1191static int send_srp_login(struct ibmvscsi_host_data *hostdata)
1192{
1193	int rc;
1194	unsigned long flags;
1195	struct srp_login_req *login;
1196	struct srp_event_struct *evt_struct = get_event_struct(&hostdata->pool);
1197
1198	BUG_ON(!evt_struct);
1199	init_event_struct(evt_struct, login_rsp,
1200			  VIOSRP_SRP_FORMAT, login_timeout);
1201
1202	login = &evt_struct->iu.srp.login_req;
1203	memset(login, 0, sizeof(*login));
1204	login->opcode = SRP_LOGIN_REQ;
1205	login->req_it_iu_len = cpu_to_be32(sizeof(union srp_iu));
1206	login->req_buf_fmt = cpu_to_be16(SRP_BUF_FORMAT_DIRECT |
1207					 SRP_BUF_FORMAT_INDIRECT);
1208
1209	spin_lock_irqsave(hostdata->host->host_lock, flags);
1210	/* Start out with a request limit of 0, since this is negotiated in
1211	 * the login request we are just sending and login requests always
1212	 * get sent by the driver regardless of request_limit.
1213	 */
1214	atomic_set(&hostdata->request_limit, 0);
1215
1216	rc = ibmvscsi_send_srp_event(evt_struct, hostdata, login_timeout * 2);
1217	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1218	dev_info(hostdata->dev, "sent SRP login\n");
1219	return rc;
1220};
1221
1222/**
1223 * capabilities_rsp: - Handle response to MAD adapter capabilities request
1224 * @evt_struct:	srp_event_struct with the response
1225 *
1226 * Used as a "done" callback by when sending adapter_info.
1227 */
1228static void capabilities_rsp(struct srp_event_struct *evt_struct)
1229{
1230	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1231
1232	if (evt_struct->xfer_iu->mad.capabilities.common.status) {
1233		dev_err(hostdata->dev, "error 0x%X getting capabilities info\n",
1234			evt_struct->xfer_iu->mad.capabilities.common.status);
1235	} else {
1236		if (hostdata->caps.migration.common.server_support !=
1237		    cpu_to_be16(SERVER_SUPPORTS_CAP))
1238			dev_info(hostdata->dev, "Partition migration not supported\n");
1239
1240		if (client_reserve) {
1241			if (hostdata->caps.reserve.common.server_support ==
1242			    cpu_to_be16(SERVER_SUPPORTS_CAP))
1243				dev_info(hostdata->dev, "Client reserve enabled\n");
1244			else
1245				dev_info(hostdata->dev, "Client reserve not supported\n");
1246		}
1247	}
1248
1249	send_srp_login(hostdata);
1250}
1251
1252/**
1253 * send_mad_capabilities: - Sends the mad capabilities request
1254 *      and stores the result so it can be retrieved with
1255 * @hostdata:	ibmvscsi_host_data of host
1256 */
1257static void send_mad_capabilities(struct ibmvscsi_host_data *hostdata)
1258{
1259	struct viosrp_capabilities *req;
1260	struct srp_event_struct *evt_struct;
1261	unsigned long flags;
1262	struct device_node *of_node = hostdata->dev->of_node;
1263	const char *location;
1264
1265	evt_struct = get_event_struct(&hostdata->pool);
1266	BUG_ON(!evt_struct);
1267
1268	init_event_struct(evt_struct, capabilities_rsp,
1269			  VIOSRP_MAD_FORMAT, info_timeout);
1270
1271	req = &evt_struct->iu.mad.capabilities;
1272	memset(req, 0, sizeof(*req));
1273
1274	hostdata->caps.flags = cpu_to_be32(CAP_LIST_SUPPORTED);
1275	if (hostdata->client_migrated)
1276		hostdata->caps.flags |= cpu_to_be32(CLIENT_MIGRATED);
1277
1278	strncpy(hostdata->caps.name, dev_name(&hostdata->host->shost_gendev),
1279		sizeof(hostdata->caps.name));
1280	hostdata->caps.name[sizeof(hostdata->caps.name) - 1] = '\0';
1281
1282	location = of_get_property(of_node, "ibm,loc-code", NULL);
1283	location = location ? location : dev_name(hostdata->dev);
1284	strncpy(hostdata->caps.loc, location, sizeof(hostdata->caps.loc));
1285	hostdata->caps.loc[sizeof(hostdata->caps.loc) - 1] = '\0';
1286
1287	req->common.type = cpu_to_be32(VIOSRP_CAPABILITIES_TYPE);
1288	req->buffer = cpu_to_be64(hostdata->caps_addr);
1289
1290	hostdata->caps.migration.common.cap_type =
1291				cpu_to_be32(MIGRATION_CAPABILITIES);
1292	hostdata->caps.migration.common.length =
1293				cpu_to_be16(sizeof(hostdata->caps.migration));
1294	hostdata->caps.migration.common.server_support =
1295				cpu_to_be16(SERVER_SUPPORTS_CAP);
1296	hostdata->caps.migration.ecl = cpu_to_be32(1);
1297
1298	if (client_reserve) {
1299		hostdata->caps.reserve.common.cap_type =
1300					cpu_to_be32(RESERVATION_CAPABILITIES);
1301		hostdata->caps.reserve.common.length =
1302				cpu_to_be16(sizeof(hostdata->caps.reserve));
1303		hostdata->caps.reserve.common.server_support =
1304				cpu_to_be16(SERVER_SUPPORTS_CAP);
1305		hostdata->caps.reserve.type =
1306				cpu_to_be32(CLIENT_RESERVE_SCSI_2);
1307		req->common.length =
1308				cpu_to_be16(sizeof(hostdata->caps));
1309	} else
1310		req->common.length = cpu_to_be16(sizeof(hostdata->caps) -
1311						sizeof(hostdata->caps.reserve));
1312
1313	spin_lock_irqsave(hostdata->host->host_lock, flags);
1314	if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1315		dev_err(hostdata->dev, "couldn't send CAPABILITIES_REQ!\n");
1316	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1317};
1318
1319/**
1320 * fast_fail_rsp: - Handle response to MAD enable fast fail
1321 * @evt_struct:	srp_event_struct with the response
1322 *
1323 * Used as a "done" callback by when sending enable fast fail. Gets called
1324 * by ibmvscsi_handle_crq()
1325 */
1326static void fast_fail_rsp(struct srp_event_struct *evt_struct)
1327{
1328	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1329	u16 status = be16_to_cpu(evt_struct->xfer_iu->mad.fast_fail.common.status);
1330
1331	if (status == VIOSRP_MAD_NOT_SUPPORTED)
1332		dev_err(hostdata->dev, "fast_fail not supported in server\n");
1333	else if (status == VIOSRP_MAD_FAILED)
1334		dev_err(hostdata->dev, "fast_fail request failed\n");
1335	else if (status != VIOSRP_MAD_SUCCESS)
1336		dev_err(hostdata->dev, "error 0x%X enabling fast_fail\n", status);
1337
1338	send_mad_capabilities(hostdata);
1339}
1340
1341/**
1342 * init_host - Start host initialization
1343 * @hostdata:	ibmvscsi_host_data of host
1344 *
1345 * Returns zero if successful.
1346 */
1347static int enable_fast_fail(struct ibmvscsi_host_data *hostdata)
1348{
1349	int rc;
1350	unsigned long flags;
1351	struct viosrp_fast_fail *fast_fail_mad;
1352	struct srp_event_struct *evt_struct;
1353
1354	if (!fast_fail) {
1355		send_mad_capabilities(hostdata);
1356		return 0;
1357	}
1358
1359	evt_struct = get_event_struct(&hostdata->pool);
1360	BUG_ON(!evt_struct);
1361
1362	init_event_struct(evt_struct, fast_fail_rsp, VIOSRP_MAD_FORMAT, info_timeout);
1363
1364	fast_fail_mad = &evt_struct->iu.mad.fast_fail;
1365	memset(fast_fail_mad, 0, sizeof(*fast_fail_mad));
1366	fast_fail_mad->common.type = cpu_to_be32(VIOSRP_ENABLE_FAST_FAIL);
1367	fast_fail_mad->common.length = cpu_to_be16(sizeof(*fast_fail_mad));
1368
1369	spin_lock_irqsave(hostdata->host->host_lock, flags);
1370	rc = ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2);
1371	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1372	return rc;
1373}
1374
1375/**
1376 * adapter_info_rsp: - Handle response to MAD adapter info request
1377 * @evt_struct:	srp_event_struct with the response
1378 *
1379 * Used as a "done" callback by when sending adapter_info. Gets called
1380 * by ibmvscsi_handle_crq()
1381*/
1382static void adapter_info_rsp(struct srp_event_struct *evt_struct)
1383{
1384	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1385
1386	if (evt_struct->xfer_iu->mad.adapter_info.common.status) {
1387		dev_err(hostdata->dev, "error %d getting adapter info\n",
1388			evt_struct->xfer_iu->mad.adapter_info.common.status);
1389	} else {
1390		dev_info(hostdata->dev, "host srp version: %s, "
1391			 "host partition %s (%d), OS %d, max io %u\n",
1392			 hostdata->madapter_info.srp_version,
1393			 hostdata->madapter_info.partition_name,
1394			 be32_to_cpu(hostdata->madapter_info.partition_number),
1395			 be32_to_cpu(hostdata->madapter_info.os_type),
1396			 be32_to_cpu(hostdata->madapter_info.port_max_txu[0]));
1397		
1398		if (hostdata->madapter_info.port_max_txu[0]) 
1399			hostdata->host->max_sectors = 
1400				be32_to_cpu(hostdata->madapter_info.port_max_txu[0]) >> 9;
1401		
1402		if (be32_to_cpu(hostdata->madapter_info.os_type) == SRP_MAD_OS_AIX &&
1403		    strcmp(hostdata->madapter_info.srp_version, "1.6a") <= 0) {
1404			dev_err(hostdata->dev, "host (Ver. %s) doesn't support large transfers\n",
1405				hostdata->madapter_info.srp_version);
1406			dev_err(hostdata->dev, "limiting scatterlists to %d\n",
1407				MAX_INDIRECT_BUFS);
1408			hostdata->host->sg_tablesize = MAX_INDIRECT_BUFS;
1409		}
1410
1411		if (be32_to_cpu(hostdata->madapter_info.os_type) == SRP_MAD_OS_AIX) {
1412			enable_fast_fail(hostdata);
1413			return;
1414		}
1415	}
1416
1417	send_srp_login(hostdata);
1418}
1419
1420/**
1421 * send_mad_adapter_info: - Sends the mad adapter info request
1422 *      and stores the result so it can be retrieved with
1423 *      sysfs.  We COULD consider causing a failure if the
1424 *      returned SRP version doesn't match ours.
1425 * @hostdata:	ibmvscsi_host_data of host
1426 * 
1427 * Returns zero if successful.
1428*/
1429static void send_mad_adapter_info(struct ibmvscsi_host_data *hostdata)
1430{
1431	struct viosrp_adapter_info *req;
1432	struct srp_event_struct *evt_struct;
1433	unsigned long flags;
1434
1435	evt_struct = get_event_struct(&hostdata->pool);
1436	BUG_ON(!evt_struct);
1437
1438	init_event_struct(evt_struct,
1439			  adapter_info_rsp,
1440			  VIOSRP_MAD_FORMAT,
1441			  info_timeout);
1442	
1443	req = &evt_struct->iu.mad.adapter_info;
1444	memset(req, 0x00, sizeof(*req));
1445	
1446	req->common.type = cpu_to_be32(VIOSRP_ADAPTER_INFO_TYPE);
1447	req->common.length = cpu_to_be16(sizeof(hostdata->madapter_info));
1448	req->buffer = cpu_to_be64(hostdata->adapter_info_addr);
1449
1450	spin_lock_irqsave(hostdata->host->host_lock, flags);
1451	if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1452		dev_err(hostdata->dev, "couldn't send ADAPTER_INFO_REQ!\n");
1453	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1454};
1455
/**
 * init_adapter: Start virtual adapter initialization sequence
 * @hostdata:	ibmvscsi_host_data of host
 *
 * The sequence begins with the adapter info request; each response
 * handler then issues the following step.
 */
static void init_adapter(struct ibmvscsi_host_data *hostdata)
{
	/* First step of the chain */
	send_mad_adapter_info(hostdata);
}
1464
1465/**
1466 * sync_completion: Signal that a synchronous command has completed
1467 * Note that after returning from this call, the evt_struct is freed.
1468 * the caller waiting on this completion shouldn't touch the evt_struct
1469 * again.
1470 */
1471static void sync_completion(struct srp_event_struct *evt_struct)
1472{
1473	/* copy the response back */
1474	if (evt_struct->sync_srp)
1475		*evt_struct->sync_srp = *evt_struct->xfer_iu;
1476	
1477	complete(&evt_struct->comp);
1478}
1479
1480/**
1481 * ibmvscsi_abort: Abort a command...from scsi host template
1482 * send this over to the server and wait synchronously for the response
1483 */
1484static int ibmvscsi_eh_abort_handler(struct scsi_cmnd *cmd)
1485{
1486	struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1487	struct srp_tsk_mgmt *tsk_mgmt;
1488	struct srp_event_struct *evt;
1489	struct srp_event_struct *tmp_evt, *found_evt;
1490	union viosrp_iu srp_rsp;
1491	int rsp_rc;
1492	unsigned long flags;
1493	u16 lun = lun_from_dev(cmd->device);
1494	unsigned long wait_switch = 0;
1495
1496	/* First, find this command in our sent list so we can figure
1497	 * out the correct tag
1498	 */
1499	spin_lock_irqsave(hostdata->host->host_lock, flags);
1500	wait_switch = jiffies + (init_timeout * HZ);
1501	do {
1502		found_evt = NULL;
1503		list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1504			if (tmp_evt->cmnd == cmd) {
1505				found_evt = tmp_evt;
1506				break;
1507			}
1508		}
1509
1510		if (!found_evt) {
1511			spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1512			return SUCCESS;
1513		}
1514
1515		evt = get_event_struct(&hostdata->pool);
1516		if (evt == NULL) {
1517			spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1518			sdev_printk(KERN_ERR, cmd->device,
1519				"failed to allocate abort event\n");
1520			return FAILED;
1521		}
1522	
1523		init_event_struct(evt,
1524				  sync_completion,
1525				  VIOSRP_SRP_FORMAT,
1526				  abort_timeout);
1527
1528		tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1529	
1530		/* Set up an abort SRP command */
1531		memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1532		tsk_mgmt->opcode = SRP_TSK_MGMT;
1533		int_to_scsilun(lun, &tsk_mgmt->lun);
1534		tsk_mgmt->tsk_mgmt_func = SRP_TSK_ABORT_TASK;
1535		tsk_mgmt->task_tag = (u64) found_evt;
1536
1537		evt->sync_srp = &srp_rsp;
1538
1539		init_completion(&evt->comp);
1540		rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, abort_timeout * 2);
1541
1542		if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1543			break;
1544
1545		spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1546		msleep(10);
1547		spin_lock_irqsave(hostdata->host->host_lock, flags);
1548	} while (time_before(jiffies, wait_switch));
1549
1550	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1551
1552	if (rsp_rc != 0) {
1553		sdev_printk(KERN_ERR, cmd->device,
1554			    "failed to send abort() event. rc=%d\n", rsp_rc);
1555		return FAILED;
1556	}
1557
1558	sdev_printk(KERN_INFO, cmd->device,
1559                    "aborting command. lun 0x%llx, tag 0x%llx\n",
1560		    (((u64) lun) << 48), (u64) found_evt);
1561
1562	wait_for_completion(&evt->comp);
1563
1564	/* make sure we got a good response */
1565	if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1566		if (printk_ratelimit())
1567			sdev_printk(KERN_WARNING, cmd->device, "abort bad SRP RSP type %d\n",
1568				    srp_rsp.srp.rsp.opcode);
1569		return FAILED;
1570	}
1571
1572	if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1573		rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1574	else
1575		rsp_rc = srp_rsp.srp.rsp.status;
1576
1577	if (rsp_rc) {
1578		if (printk_ratelimit())
1579			sdev_printk(KERN_WARNING, cmd->device,
1580				    "abort code %d for task tag 0x%llx\n",
1581				    rsp_rc, tsk_mgmt->task_tag);
1582		return FAILED;
1583	}
1584
1585	/* Because we dropped the spinlock above, it's possible
1586	 * The event is no longer in our list.  Make sure it didn't
1587	 * complete while we were aborting
1588	 */
1589	spin_lock_irqsave(hostdata->host->host_lock, flags);
1590	found_evt = NULL;
1591	list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1592		if (tmp_evt->cmnd == cmd) {
1593			found_evt = tmp_evt;
1594			break;
1595		}
1596	}
1597
1598	if (found_evt == NULL) {
1599		spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1600		sdev_printk(KERN_INFO, cmd->device, "aborted task tag 0x%llx completed\n",
1601			    tsk_mgmt->task_tag);
1602		return SUCCESS;
1603	}
1604
1605	sdev_printk(KERN_INFO, cmd->device, "successfully aborted task tag 0x%llx\n",
1606		    tsk_mgmt->task_tag);
1607
1608	cmd->result = (DID_ABORT << 16);
1609	list_del(&found_evt->list);
1610	unmap_cmd_data(&found_evt->iu.srp.cmd, found_evt,
1611		       found_evt->hostdata->dev);
1612	free_event_struct(&found_evt->hostdata->pool, found_evt);
1613	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1614	atomic_inc(&hostdata->request_limit);
1615	return SUCCESS;
1616}
1617
1618/**
1619 * ibmvscsi_eh_device_reset_handler: Reset a single LUN...from scsi host 
1620 * template send this over to the server and wait synchronously for the 
1621 * response
1622 */
1623static int ibmvscsi_eh_device_reset_handler(struct scsi_cmnd *cmd)
1624{
1625	struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1626	struct srp_tsk_mgmt *tsk_mgmt;
1627	struct srp_event_struct *evt;
1628	struct srp_event_struct *tmp_evt, *pos;
1629	union viosrp_iu srp_rsp;
1630	int rsp_rc;
1631	unsigned long flags;
1632	u16 lun = lun_from_dev(cmd->device);
1633	unsigned long wait_switch = 0;
1634
1635	spin_lock_irqsave(hostdata->host->host_lock, flags);
1636	wait_switch = jiffies + (init_timeout * HZ);
1637	do {
1638		evt = get_event_struct(&hostdata->pool);
1639		if (evt == NULL) {
1640			spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1641			sdev_printk(KERN_ERR, cmd->device,
1642				"failed to allocate reset event\n");
1643			return FAILED;
1644		}
1645	
1646		init_event_struct(evt,
1647				  sync_completion,
1648				  VIOSRP_SRP_FORMAT,
1649				  reset_timeout);
1650
1651		tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1652
1653		/* Set up a lun reset SRP command */
1654		memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1655		tsk_mgmt->opcode = SRP_TSK_MGMT;
1656		int_to_scsilun(lun, &tsk_mgmt->lun);
1657		tsk_mgmt->tsk_mgmt_func = SRP_TSK_LUN_RESET;
1658
1659		evt->sync_srp = &srp_rsp;
1660
1661		init_completion(&evt->comp);
1662		rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, reset_timeout * 2);
1663
1664		if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1665			break;
1666
1667		spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1668		msleep(10);
1669		spin_lock_irqsave(hostdata->host->host_lock, flags);
1670	} while (time_before(jiffies, wait_switch));
1671
1672	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1673
1674	if (rsp_rc != 0) {
1675		sdev_printk(KERN_ERR, cmd->device,
1676			    "failed to send reset event. rc=%d\n", rsp_rc);
1677		return FAILED;
1678	}
1679
1680	sdev_printk(KERN_INFO, cmd->device, "resetting device. lun 0x%llx\n",
1681		    (((u64) lun) << 48));
1682
1683	wait_for_completion(&evt->comp);
1684
1685	/* make sure we got a good response */
1686	if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1687		if (printk_ratelimit())
1688			sdev_printk(KERN_WARNING, cmd->device, "reset bad SRP RSP type %d\n",
1689				    srp_rsp.srp.rsp.opcode);
1690		return FAILED;
1691	}
1692
1693	if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1694		rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1695	else
1696		rsp_rc = srp_rsp.srp.rsp.status;
1697
1698	if (rsp_rc) {
1699		if (printk_ratelimit())
1700			sdev_printk(KERN_WARNING, cmd->device,
1701				    "reset code %d for task tag 0x%llx\n",
1702				    rsp_rc, tsk_mgmt->task_tag);
1703		return FAILED;
1704	}
1705
1706	/* We need to find all commands for this LUN that have not yet been
1707	 * responded to, and fail them with DID_RESET
1708	 */
1709	spin_lock_irqsave(hostdata->host->host_lock, flags);
1710	list_for_each_entry_safe(tmp_evt, pos, &hostdata->sent, list) {
1711		if ((tmp_evt->cmnd) && (tmp_evt->cmnd->device == cmd->device)) {
1712			if (tmp_evt->cmnd)
1713				tmp_evt->cmnd->result = (DID_RESET << 16);
1714			list_del(&tmp_evt->list);
1715			unmap_cmd_data(&tmp_evt->iu.srp.cmd, tmp_evt,
1716				       tmp_evt->hostdata->dev);
1717			free_event_struct(&tmp_evt->hostdata->pool,
1718						   tmp_evt);
1719			atomic_inc(&hostdata->request_limit);
1720			if (tmp_evt->cmnd_done)
1721				tmp_evt->cmnd_done(tmp_evt->cmnd);
1722			else if (tmp_evt->done)
1723				tmp_evt->done(tmp_evt);
1724		}
1725	}
1726	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1727	return SUCCESS;
1728}
1729
1730/**
1731 * ibmvscsi_eh_host_reset_handler - Reset the connection to the server
1732 * @cmd:	struct scsi_cmnd having problems
1733*/
1734static int ibmvscsi_eh_host_reset_handler(struct scsi_cmnd *cmd)
1735{
1736	unsigned long wait_switch = 0;
1737	struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1738
1739	dev_err(hostdata->dev, "Resetting connection due to error recovery\n");
1740
1741	ibmvscsi_reset_host(hostdata);
1742
1743	for (wait_switch = jiffies + (init_timeout * HZ);
1744	     time_before(jiffies, wait_switch) &&
1745		     atomic_read(&hostdata->request_limit) < 2;) {
1746
1747		msleep(10);
1748	}
1749
1750	if (atomic_read(&hostdata->request_limit) <= 0)
1751		return FAILED;
1752
1753	return SUCCESS;
1754}
1755
1756/**
1757 * ibmvscsi_handle_crq: - Handles and frees received events in the CRQ
1758 * @crq:	Command/Response queue
1759 * @hostdata:	ibmvscsi_host_data of host
1760 *
1761*/
1762static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
1763				struct ibmvscsi_host_data *hostdata)
1764{
1765	long rc;
1766	unsigned long flags;
1767	/* The hypervisor copies our tag value here so no byteswapping */
1768	struct srp_event_struct *evt_struct =
1769			(__force struct srp_event_struct *)crq->IU_data_ptr;
1770	switch (crq->valid) {
1771	case VIOSRP_CRQ_INIT_RSP:		/* initialization */
1772		switch (crq->format) {
1773		case VIOSRP_CRQ_INIT:	/* Initialization message */
1774			dev_info(hostdata->dev, "partner initialized\n");
1775			/* Send back a response */
1776			rc = ibmvscsi_send_crq(hostdata, 0xC002000000000000LL, 0);
1777			if (rc == 0) {
1778				/* Now login */
1779				init_adapter(hostdata);
1780			} else {
1781				dev_err(hostdata->dev, "Unable to send init rsp. rc=%ld\n", rc);
1782			}
1783
1784			break;
1785		case VIOSRP_CRQ_INIT_COMPLETE:	/* Initialization response */
1786			dev_info(hostdata->dev, "partner initialization complete\n");
1787
1788			/* Now login */
1789			init_adapter(hostdata);
1790			break;
1791		default:
1792			dev_err(hostdata->dev, "unknown crq message type: %d\n", crq->format);
1793		}
1794		return;
1795	case VIOSRP_CRQ_XPORT_EVENT:	/* Hypervisor telling us the connection is closed */
1796		scsi_block_requests(hostdata->host);
1797		atomic_set(&hostdata->request_limit, 0);
1798		if (crq->format == 0x06) {
1799			/* We need to re-setup the interpartition connection */
1800			dev_info(hostdata->dev, "Re-enabling adapter!\n");
1801			hostdata->client_migrated = 1;
1802			hostdata->reenable_crq = 1;
1803			purge_requests(hostdata, DID_REQUEUE);
1804			wake_up(&hostdata->work_wait_q);
1805		} else {
1806			dev_err(hostdata->dev, "Virtual adapter failed rc %d!\n",
1807				crq->format);
1808			ibmvscsi_reset_host(hostdata);
1809		}
1810		return;
1811	case VIOSRP_CRQ_CMD_RSP:		/* real payload */
1812		break;
1813	default:
1814		dev_err(hostdata->dev, "got an invalid message type 0x%02x\n",
1815			crq->valid);
1816		return;
1817	}
1818
1819	/* The only kind of payload CRQs we should get are responses to
1820	 * things we send. Make sure this response is to something we
1821	 * actually sent
1822	 */
1823	if (!valid_event_struct(&hostdata->pool, evt_struct)) {
1824		dev_err(hostdata->dev, "returned correlation_token 0x%p is invalid!\n",
1825		       evt_struct);
1826		return;
1827	}
1828
1829	if (atomic_read(&evt_struct->free)) {
1830		dev_err(hostdata->dev, "received duplicate correlation_token 0x%p!\n",
1831			evt_struct);
1832		return;
1833	}
1834
1835	if (crq->format == VIOSRP_SRP_FORMAT)
1836		atomic_add(be32_to_cpu(evt_struct->xfer_iu->srp.rsp.req_lim_delta),
1837			   &hostdata->request_limit);
1838
1839	del_timer(&evt_struct->timer);
1840
1841	if ((crq->status != VIOSRP_OK && crq->status != VIOSRP_OK2) && evt_struct->cmnd)
1842		evt_struct->cmnd->result = DID_ERROR << 16;
1843	if (evt_struct->done)
1844		evt_struct->done(evt_struct);
1845	else
1846		dev_err(hostdata->dev, "returned done() is NULL; not running it!\n");
1847
1848	/*
1849	 * Lock the host_lock before messing with these structures, since we
1850	 * are running in a task context
1851	 */
1852	spin_lock_irqsave(evt_struct->hostdata->host->host_lock, flags);
1853	list_del(&evt_struct->list);
1854	free_event_struct(&evt_struct->hostdata->pool, evt_struct);
1855	spin_unlock_irqrestore(evt_struct->hostdata->host->host_lock, flags);
1856}
1857
1858/**
1859 * ibmvscsi_slave_configure: Set the "allow_restart" flag for each disk.
1860 * @sdev:	struct scsi_device device to configure
1861 *
1862 * Enable allow_restart for a device if it is a disk.  Adjust the
1863 * queue_depth here also as is required by the documentation for
1864 * struct scsi_host_template.
1865 */
1866static int ibmvscsi_slave_configure(struct scsi_device *sdev)
1867{
1868	struct Scsi_Host *shost = sdev->host;
1869	unsigned long lock_flags = 0;
1870
1871	spin_lock_irqsave(shost->host_lock, lock_flags);
1872	if (sdev->type == TYPE_DISK) {
1873		sdev->allow_restart = 1;
1874		blk_queue_rq_timeout(sdev->request_queue, 120 * HZ);
1875	}
1876	spin_unlock_irqrestore(shost->host_lock, lock_flags);
1877	return 0;
1878}
1879
1880/**
1881 * ibmvscsi_change_queue_depth - Change the device's queue depth
1882 * @sdev:	scsi device struct
1883 * @qdepth:	depth to set
1884 * @reason:	calling context
1885 *
1886 * Return value:
1887 * 	actual depth set
1888 **/
1889static int ibmvscsi_change_queue_depth(struct scsi_device *sdev, int qdepth)
1890{
1891	if (qdepth > IBMVSCSI_MAX_CMDS_PER_LUN)
1892		qdepth = IBMVSCSI_MAX_CMDS_PER_LUN;
1893	return scsi_change_queue_depth(sdev, qdepth);
1894}
1895
1896/* ------------------------------------------------------------
1897 * sysfs attributes
1898 */
1899static ssize_t show_host_vhost_loc(struct device *dev,
1900				   struct device_attribute *attr, char *buf)
1901{
1902	struct Scsi_Host *shost = class_to_shost(dev);
1903	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1904	int len;
1905
1906	len = snprintf(buf, sizeof(hostdata->caps.loc), "%s\n",
1907		       hostdata->caps.loc);
1908	return len;
1909}
1910
1911static struct device_attribute ibmvscsi_host_vhost_loc = {
1912	.attr = {
1913		 .name = "vhost_loc",
1914		 .mode = S_IRUGO,
1915		 },
1916	.show = show_host_vhost_loc,
1917};
1918
1919static ssize_t show_host_vhost_name(struct device *dev,
1920				    struct device_attribute *attr, char *buf)
1921{
1922	struct Scsi_Host *shost = class_to_shost(dev);
1923	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1924	int len;
1925
1926	len = snprintf(buf, sizeof(hostdata->caps.name), "%s\n",
1927		       hostdata->caps.name);
1928	return len;
1929}
1930
1931static struct device_attribute ibmvscsi_host_vhost_name = {
1932	.attr = {
1933		 .name = "vhost_name",
1934		 .mode = S_IRUGO,
1935		 },
1936	.show = show_host_vhost_name,
1937};
1938
1939static ssize_t show_host_srp_version(struct device *dev,
1940				     struct device_attribute *attr, char *buf)
1941{
1942	struct Scsi_Host *shost = class_to_shost(dev);
1943	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1944	int len;
1945
1946	len = snprintf(buf, PAGE_SIZE, "%s\n",
1947		       hostdata->madapter_info.srp_version);
1948	return len;
1949}
1950
1951static struct device_attribute ibmvscsi_host_srp_version = {
1952	.attr = {
1953		 .name = "srp_version",
1954		 .mode = S_IRUGO,
1955		 },
1956	.show = show_host_srp_version,
1957};
1958
1959static ssize_t show_host_partition_name(struct device *dev,
1960					struct device_attribute *attr,
1961					char *buf)
1962{
1963	struct Scsi_Host *shost = class_to_shost(dev);
1964	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1965	int len;
1966
1967	len = snprintf(buf, PAGE_SIZE, "%s\n",
1968		       hostdata->madapter_info.partition_name);
1969	return len;
1970}
1971
1972static struct device_attribute ibmvscsi_host_partition_name = {
1973	.attr = {
1974		 .name = "partition_name",
1975		 .mode = S_IRUGO,
1976		 },
1977	.show = show_host_partition_name,
1978};
1979
1980static ssize_t show_host_partition_number(struct device *dev,
1981					  struct device_attribute *attr,
1982					  char *buf)
1983{
1984	struct Scsi_Host *shost = class_to_shost(dev);
1985	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1986	int len;
1987
1988	len = snprintf(buf, PAGE_SIZE, "%d\n",
1989		       be32_to_cpu(hostdata->madapter_info.partition_number));
1990	return len;
1991}
1992
1993static struct device_attribute ibmvscsi_host_partition_number = {
1994	.attr = {
1995		 .name = "partition_number",
1996		 .mode = S_IRUGO,
1997		 },
1998	.show = show_host_partition_number,
1999};
2000
2001static ssize_t show_host_mad_version(struct device *dev,
2002				     struct device_attribute *attr, char *buf)
2003{
2004	struct Scsi_Host *shost = class_to_shost(dev);
2005	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2006	int len;
2007
2008	len = snprintf(buf, PAGE_SIZE, "%d\n",
2009		       be32_to_cpu(hostdata->madapter_info.mad_version));
2010	return len;
2011}
2012
2013static struct device_attribute ibmvscsi_host_mad_version = {
2014	.attr = {
2015		 .name = "mad_version",
2016		 .mode = S_IRUGO,
2017		 },
2018	.show = show_host_mad_version,
2019};
2020
2021static ssize_t show_host_os_type(struct device *dev,
2022				 struct device_attribute *attr, char *buf)
2023{
2024	struct Scsi_Host *shost = class_to_shost(dev);
2025	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2026	int len;
2027
2028	len = snprintf(buf, PAGE_SIZE, "%d\n",
2029		       be32_to_cpu(hostdata->madapter_info.os_type));
2030	return len;
2031}
2032
2033static struct device_attribute ibmvscsi_host_os_type = {
2034	.attr = {
2035		 .name = "os_type",
2036		 .mode = S_IRUGO,
2037		 },
2038	.show = show_host_os_type,
2039};
2040
/*
 * sysfs show routine for "config": writes nothing to @buf and reports a
 * length of zero, so the attribute always reads as empty.
 */
static ssize_t show_host_config(struct device *dev,
				struct device_attribute *attr, char *buf)
{
	const ssize_t nothing_written = 0;

	return nothing_written;
}
2046
2047static struct device_attribute ibmvscsi_host_config = {
2048	.attr = {
2049		.name = "config",
2050		.mode = S_IRUGO,
2051		},
2052	.show = show_host_config,
2053};
2054
2055static struct device_attribute *ibmvscsi_attrs[] = {
2056	&ibmvscsi_host_vhost_loc,
2057	&ibmvscsi_host_vhost_name,
2058	&ibmvscsi_host_srp_version,
2059	&ibmvscsi_host_partition_name,
2060	&ibmvscsi_host_partition_number,
2061	&ibmvscsi_host_mad_version,
2062	&ibmvscsi_host_os_type,
2063	&ibmvscsi_host_config,
2064	NULL
2065};
2066
2067/* ------------------------------------------------------------
2068 * SCSI driver registration
2069 */
2070static struct scsi_host_template driver_template = {
2071	.module = THIS_MODULE,
2072	.name = "IBM POWER Virtual SCSI Adapter " IBMVSCSI_VERSION,
2073	.proc_name = "ibmvscsi",
2074	.queuecommand = ibmvscsi_queuecommand,
 
2075	.eh_abort_handler = ibmvscsi_eh_abort_handler,
2076	.eh_device_reset_handler = ibmvscsi_eh_device_reset_handler,
2077	.eh_host_reset_handler = ibmvscsi_eh_host_reset_handler,
2078	.slave_configure = ibmvscsi_slave_configure,
2079	.change_queue_depth = ibmvscsi_change_queue_depth,
2080	.cmd_per_lun = IBMVSCSI_CMDS_PER_LUN_DEFAULT,
2081	.can_queue = IBMVSCSI_MAX_REQUESTS_DEFAULT,
2082	.this_id = -1,
2083	.sg_tablesize = SG_ALL,
2084	.use_clustering = ENABLE_CLUSTERING,
2085	.shost_attrs = ibmvscsi_attrs,
2086};
2087
2088/**
2089 * ibmvscsi_get_desired_dma - Calculate IO memory desired by the driver
2090 *
2091 * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
2092 *
2093 * Return value:
2094 *	Number of bytes of IO data the driver will need to perform well.
2095 */
2096static unsigned long ibmvscsi_get_desired_dma(struct vio_dev *vdev)
2097{
2098	/* iu_storage data allocated in initialize_event_pool */
2099	unsigned long desired_io = max_events * sizeof(union viosrp_iu);
2100
2101	/* add io space for sg data */
2102	desired_io += (IBMVSCSI_MAX_SECTORS_DEFAULT * 512 *
2103	                     IBMVSCSI_CMDS_PER_LUN_DEFAULT);
2104
2105	return desired_io;
2106}
2107
2108static void ibmvscsi_do_work(struct ibmvscsi_host_data *hostdata)
2109{
2110	int rc;
2111	char *action = "reset";
2112
2113	if (hostdata->reset_crq) {
2114		smp_rmb();
2115		hostdata->reset_crq = 0;
2116
2117		rc = ibmvscsi_reset_crq_queue(&hostdata->queue, hostdata);
2118		if (!rc)
2119			rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
2120		vio_enable_interrupts(to_vio_dev(hostdata->dev));
2121	} else if (hostdata->reenable_crq) {
2122		smp_rmb();
2123		action = "enable";
2124		rc = ibmvscsi_reenable_crq_queue(&hostdata->queue, hostdata);
2125		hostdata->reenable_crq = 0;
2126		if (!rc)
2127			rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
2128	} else
2129		return;
2130
2131	if (rc) {
2132		atomic_set(&hostdata->request_limit, -1);
2133		dev_err(hostdata->dev, "error after %s\n", action);
2134	}
2135
2136	scsi_unblock_requests(hostdata->host);
2137}
2138
2139static int ibmvscsi_work_to_do(struct ibmvscsi_host_data *hostdata)
2140{
2141	if (kthread_should_stop())
2142		return 1;
2143	else if (hostdata->reset_crq) {
2144		smp_rmb();
2145		return 1;
2146	} else if (hostdata->reenable_crq) {
2147		smp_rmb();
2148		return 1;
2149	}
2150
2151	return 0;
2152}
2153
2154static int ibmvscsi_work(void *data)
2155{
2156	struct ibmvscsi_host_data *hostdata = data;
2157	int rc;
2158
2159	set_user_nice(current, MIN_NICE);
2160
2161	while (1) {
2162		rc = wait_event_interruptible(hostdata->work_wait_q,
2163					      ibmvscsi_work_to_do(hostdata));
2164
2165		BUG_ON(rc);
2166
2167		if (kthread_should_stop())
2168			break;
2169
2170		ibmvscsi_do_work(hostdata);
2171	}
2172
2173	return 0;
2174}
2175
2176/**
2177 * Called by bus code for each adapter
2178 */
2179static int ibmvscsi_probe(struct vio_dev *vdev, const struct vio_device_id *id)
2180{
2181	struct ibmvscsi_host_data *hostdata;
2182	struct Scsi_Host *host;
2183	struct device *dev = &vdev->dev;
2184	struct srp_rport_identifiers ids;
2185	struct srp_rport *rport;
2186	unsigned long wait_switch = 0;
2187	int rc;
2188
2189	dev_set_drvdata(&vdev->dev, NULL);
2190
2191	host = scsi_host_alloc(&driver_template, sizeof(*hostdata));
2192	if (!host) {
2193		dev_err(&vdev->dev, "couldn't allocate host data\n");
2194		goto scsi_host_alloc_failed;
2195	}
2196
2197	host->transportt = ibmvscsi_transport_template;
2198	hostdata = shost_priv(host);
2199	memset(hostdata, 0x00, sizeof(*hostdata));
2200	INIT_LIST_HEAD(&hostdata->sent);
2201	init_waitqueue_head(&hostdata->work_wait_q);
2202	hostdata->host = host;
2203	hostdata->dev = dev;
2204	atomic_set(&hostdata->request_limit, -1);
2205	hostdata->host->max_sectors = IBMVSCSI_MAX_SECTORS_DEFAULT;
2206
2207	if (map_persist_bufs(hostdata)) {
2208		dev_err(&vdev->dev, "couldn't map persistent buffers\n");
2209		goto persist_bufs_failed;
2210	}
2211
2212	hostdata->work_thread = kthread_run(ibmvscsi_work, hostdata, "%s_%d",
2213					    "ibmvscsi", host->host_no);
2214
2215	if (IS_ERR(hostdata->work_thread)) {
2216		dev_err(&vdev->dev, "couldn't initialize kthread. rc=%ld\n",
2217			PTR_ERR(hostdata->work_thread));
2218		goto init_crq_failed;
2219	}
2220
2221	rc = ibmvscsi_init_crq_queue(&hostdata->queue, hostdata, max_events);
2222	if (rc != 0 && rc != H_RESOURCE) {
2223		dev_err(&vdev->dev, "couldn't initialize crq. rc=%d\n", rc);
2224		goto kill_kthread;
2225	}
2226	if (initialize_event_pool(&hostdata->pool, max_events, hostdata) != 0) {
2227		dev_err(&vdev->dev, "couldn't initialize event pool\n");
2228		goto init_pool_failed;
2229	}
2230
2231	host->max_lun = IBMVSCSI_MAX_LUN;
2232	host->max_id = max_id;
2233	host->max_channel = max_channel;
2234	host->max_cmd_len = 16;
2235
2236	dev_info(dev,
2237		 "Maximum ID: %d Maximum LUN: %llu Maximum Channel: %d\n",
2238		 host->max_id, host->max_lun, host->max_channel);
2239
2240	if (scsi_add_host(hostdata->host, hostdata->dev))
2241		goto add_host_failed;
2242
2243	/* we don't have a proper target_port_id so let's use the fake one */
2244	memcpy(ids.port_id, hostdata->madapter_info.partition_name,
2245	       sizeof(ids.port_id));
2246	ids.roles = SRP_RPORT_ROLE_TARGET;
2247	rport = srp_rport_add(host, &ids);
2248	if (IS_ERR(rport))
2249		goto add_srp_port_failed;
2250
2251	/* Try to send an initialization message.  Note that this is allowed
2252	 * to fail if the other end is not acive.  In that case we don't
2253	 * want to scan
2254	 */
2255	if (ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0) == 0
2256	    || rc == H_RESOURCE) {
2257		/*
2258		 * Wait around max init_timeout secs for the adapter to finish
2259		 * initializing. When we are done initializing, we will have a
2260		 * valid request_limit.  We don't want Linux scanning before
2261		 * we are ready.
2262		 */
2263		for (wait_switch = jiffies + (init_timeout * HZ);
2264		     time_before(jiffies, wait_switch) &&
2265		     atomic_read(&hostdata->request_limit) < 2;) {
2266
2267			msleep(10);
2268		}
2269
2270		/* if we now have a valid request_limit, initiate a scan */
2271		if (atomic_read(&hostdata->request_limit) > 0)
2272			scsi_scan_host(host);
2273	}
2274
2275	dev_set_drvdata(&vdev->dev, hostdata);
2276	list_add_tail(&hostdata->host_list, &ibmvscsi_head);
2277	return 0;
2278
2279      add_srp_port_failed:
2280	scsi_remove_host(hostdata->host);
2281      add_host_failed:
2282	release_event_pool(&hostdata->pool, hostdata);
2283      init_pool_failed:
2284	ibmvscsi_release_crq_queue(&hostdata->queue, hostdata, max_events);
2285      kill_kthread:
2286      kthread_stop(hostdata->work_thread);
2287      init_crq_failed:
2288	unmap_persist_bufs(hostdata);
2289      persist_bufs_failed:
2290	scsi_host_put(host);
2291      scsi_host_alloc_failed:
2292	return -1;
2293}
2294
2295static int ibmvscsi_remove(struct vio_dev *vdev)
2296{
2297	struct ibmvscsi_host_data *hostdata = dev_get_drvdata(&vdev->dev);
2298	list_del(&hostdata->host_list);
2299	unmap_persist_bufs(hostdata);
2300	release_event_pool(&hostdata->pool, hostdata);
2301	ibmvscsi_release_crq_queue(&hostdata->queue, hostdata,
2302					max_events);
2303
2304	kthread_stop(hostdata->work_thread);
2305	srp_remove_host(hostdata->host);
2306	scsi_remove_host(hostdata->host);
2307	scsi_host_put(hostdata->host);
2308
2309	return 0;
2310}
2311
2312/**
2313 * ibmvscsi_resume: Resume from suspend
2314 * @dev:	device struct
2315 *
2316 * We may have lost an interrupt across suspend/resume, so kick the
2317 * interrupt handler
2318 */
2319static int ibmvscsi_resume(struct device *dev)
2320{
2321	struct ibmvscsi_host_data *hostdata = dev_get_drvdata(dev);
2322	vio_disable_interrupts(to_vio_dev(hostdata->dev));
2323	tasklet_schedule(&hostdata->srp_task);
2324
2325	return 0;
2326}
2327
2328/**
2329 * ibmvscsi_device_table: Used by vio.c to match devices in the device tree we 
2330 * support.
2331 */
2332static struct vio_device_id ibmvscsi_device_table[] = {
2333	{"vscsi", "IBM,v-scsi"},
2334	{ "", "" }
2335};
2336MODULE_DEVICE_TABLE(vio, ibmvscsi_device_table);
2337
2338static struct dev_pm_ops ibmvscsi_pm_ops = {
2339	.resume = ibmvscsi_resume
2340};
2341
2342static struct vio_driver ibmvscsi_driver = {
2343	.id_table = ibmvscsi_device_table,
2344	.probe = ibmvscsi_probe,
2345	.remove = ibmvscsi_remove,
2346	.get_desired_dma = ibmvscsi_get_desired_dma,
2347	.name = "ibmvscsi",
2348	.pm = &ibmvscsi_pm_ops,
2349};
2350
2351static struct srp_function_template ibmvscsi_transport_functions = {
2352};
2353
2354int __init ibmvscsi_module_init(void)
2355{
2356	int ret;
2357
2358	/* Ensure we have two requests to do error recovery */
2359	driver_template.can_queue = max_requests;
2360	max_events = max_requests + 2;
2361
2362	if (!firmware_has_feature(FW_FEATURE_VIO))
2363		return -ENODEV;
2364
2365	ibmvscsi_transport_template =
2366		srp_attach_transport(&ibmvscsi_transport_functions);
2367	if (!ibmvscsi_transport_template)
2368		return -ENOMEM;
2369
2370	ret = vio_register_driver(&ibmvscsi_driver);
2371	if (ret)
2372		srp_release_transport(ibmvscsi_transport_template);
2373	return ret;
2374}
2375
2376void __exit ibmvscsi_module_exit(void)
2377{
2378	vio_unregister_driver(&ibmvscsi_driver);
2379	srp_release_transport(ibmvscsi_transport_template);
2380}
2381
2382module_init(ibmvscsi_module_init);
2383module_exit(ibmvscsi_module_exit);
v4.17
   1/* ------------------------------------------------------------
   2 * ibmvscsi.c
   3 * (C) Copyright IBM Corporation 1994, 2004
   4 * Authors: Colin DeVilbiss (devilbis@us.ibm.com)
   5 *          Santiago Leon (santil@us.ibm.com)
   6 *          Dave Boutcher (sleddog@us.ibm.com)
   7 *
   8 * This program is free software; you can redistribute it and/or modify
   9 * it under the terms of the GNU General Public License as published by
  10 * the Free Software Foundation; either version 2 of the License, or
  11 * (at your option) any later version.
  12 *
  13 * This program is distributed in the hope that it will be useful,
  14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
  15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  16 * GNU General Public License for more details.
  17 *
  18 * You should have received a copy of the GNU General Public License
  19 * along with this program; if not, write to the Free Software
  20 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307
  21 * USA
  22 *
  23 * ------------------------------------------------------------
  24 * Emulation of a SCSI host adapter for Virtual I/O devices
  25 *
  26 * This driver supports the SCSI adapter implemented by the IBM
  27 * Power5 firmware.  That SCSI adapter is not a physical adapter,
  28 * but allows Linux SCSI peripheral drivers to directly
  29 * access devices in another logical partition on the physical system.
  30 *
  31 * The virtual adapter(s) are present in the open firmware device
  32 * tree just like real adapters.
  33 *
  34 * One of the capabilities provided on these systems is the ability
  35 * to DMA between partitions.  The architecture states that for VSCSI,
  36 * the server side is allowed to DMA to and from the client.  The client
  37 * is never trusted to DMA to or from the server directly.
  38 *
  39 * Messages are sent between partitions on a "Command/Response Queue" 
 * (CRQ), which is just a buffer of 16 byte entries in the receiver's memory.
  41 * Senders cannot access the buffer directly, but send messages by
  42 * making a hypervisor call and passing in the 16 bytes.  The hypervisor
  43 * puts the message in the next 16 byte space in round-robin fashion,
  44 * turns on the high order bit of the message (the valid bit), and 
  45 * generates an interrupt to the receiver (if interrupts are turned on.) 
  46 * The receiver just turns off the valid bit when they have copied out
  47 * the message.
  48 *
  49 * The VSCSI client builds a SCSI Remote Protocol (SRP) Information Unit
  50 * (IU) (as defined in the T10 standard available at www.t10.org), gets 
  51 * a DMA address for the message, and sends it to the server as the
  52 * payload of a CRQ message.  The server DMAs the SRP IU and processes it,
  53 * including doing any additional data transfers.  When it is done, it
  54 * DMAs the SRP response back to the same address as the request came from,
  55 * and sends a CRQ message back to inform the client that the request has
  56 * completed.
  57 *
  58 * TODO: This is currently pretty tied to the IBM pSeries hypervisor
  59 * interfaces.  It would be really nice to abstract this above an RDMA
  60 * layer.
  61 */
  62
  63#include <linux/module.h>
  64#include <linux/moduleparam.h>
  65#include <linux/dma-mapping.h>
  66#include <linux/delay.h>
  67#include <linux/slab.h>
  68#include <linux/of.h>
  69#include <linux/pm.h>
  70#include <linux/kthread.h>
  71#include <asm/firmware.h>
  72#include <asm/vio.h>
  73#include <scsi/scsi.h>
  74#include <scsi/scsi_cmnd.h>
  75#include <scsi/scsi_host.h>
  76#include <scsi/scsi_device.h>
  77#include <scsi/scsi_transport_srp.h>
  78#include "ibmvscsi.h"
  79
  80/* The values below are somewhat arbitrary default values, but 
  81 * OS/400 will use 3 busses (disks, CDs, tapes, I think.)
  82 * Note that there are 3 bits of channel value, 6 bits of id, and
  83 * 5 bits of LUN.
  84 */
  85static int max_id = 64;
  86static int max_channel = 3;
  87static int init_timeout = 300;
  88static int login_timeout = 60;
  89static int info_timeout = 30;
  90static int abort_timeout = 60;
  91static int reset_timeout = 60;
  92static int max_requests = IBMVSCSI_MAX_REQUESTS_DEFAULT;
  93static int max_events = IBMVSCSI_MAX_REQUESTS_DEFAULT + 2;
  94static int fast_fail = 1;
  95static int client_reserve = 1;
  96static char partition_name[97] = "UNKNOWN";
  97static unsigned int partition_number = -1;
  98static LIST_HEAD(ibmvscsi_head);
  99
 100static struct scsi_transport_template *ibmvscsi_transport_template;
 101
 102#define IBMVSCSI_VERSION "1.5.9"
 103
 104MODULE_DESCRIPTION("IBM Virtual SCSI");
 105MODULE_AUTHOR("Dave Boutcher");
 106MODULE_LICENSE("GPL");
 107MODULE_VERSION(IBMVSCSI_VERSION);
 108
 109module_param_named(max_id, max_id, int, S_IRUGO | S_IWUSR);
 110MODULE_PARM_DESC(max_id, "Largest ID value for each channel [Default=64]");
 111module_param_named(max_channel, max_channel, int, S_IRUGO | S_IWUSR);
 112MODULE_PARM_DESC(max_channel, "Largest channel value [Default=3]");
 113module_param_named(init_timeout, init_timeout, int, S_IRUGO | S_IWUSR);
 114MODULE_PARM_DESC(init_timeout, "Initialization timeout in seconds");
 115module_param_named(max_requests, max_requests, int, S_IRUGO);
 116MODULE_PARM_DESC(max_requests, "Maximum requests for this adapter");
 117module_param_named(fast_fail, fast_fail, int, S_IRUGO | S_IWUSR);
 118MODULE_PARM_DESC(fast_fail, "Enable fast fail. [Default=1]");
 119module_param_named(client_reserve, client_reserve, int, S_IRUGO );
 120MODULE_PARM_DESC(client_reserve, "Attempt client managed reserve/release");
 121
 122static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
 123				struct ibmvscsi_host_data *hostdata);
 124
 125/* ------------------------------------------------------------
 126 * Routines for managing the command/response queue
 127 */
 128/**
 129 * ibmvscsi_handle_event: - Interrupt handler for crq events
 130 * @irq:	number of irq to handle, not used
 131 * @dev_instance: ibmvscsi_host_data of host that received interrupt
 132 *
 133 * Disables interrupts and schedules srp_task
 134 * Always returns IRQ_HANDLED
 135 */
 136static irqreturn_t ibmvscsi_handle_event(int irq, void *dev_instance)
 137{
 138	struct ibmvscsi_host_data *hostdata =
 139	    (struct ibmvscsi_host_data *)dev_instance;
 140	vio_disable_interrupts(to_vio_dev(hostdata->dev));
 141	tasklet_schedule(&hostdata->srp_task);
 142	return IRQ_HANDLED;
 143}
 144
 145/**
 146 * release_crq_queue: - Deallocates data and unregisters CRQ
 147 * @queue:	crq_queue to initialize and register
 148 * @host_data:	ibmvscsi_host_data of host
 149 *
 150 * Frees irq, deallocates a page for messages, unmaps dma, and unregisters
 151 * the crq with the hypervisor.
 152 */
 153static void ibmvscsi_release_crq_queue(struct crq_queue *queue,
 154				       struct ibmvscsi_host_data *hostdata,
 155				       int max_requests)
 156{
 157	long rc = 0;
 158	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 159	free_irq(vdev->irq, (void *)hostdata);
 160	tasklet_kill(&hostdata->srp_task);
 161	do {
 162		if (rc)
 163			msleep(100);
 164		rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 165	} while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 166	dma_unmap_single(hostdata->dev,
 167			 queue->msg_token,
 168			 queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
 169	free_page((unsigned long)queue->msgs);
 170}
 171
 172/**
 173 * crq_queue_next_crq: - Returns the next entry in message queue
 174 * @queue:	crq_queue to use
 175 *
 176 * Returns pointer to next entry in queue, or NULL if there are no new
 177 * entried in the CRQ.
 178 */
 179static struct viosrp_crq *crq_queue_next_crq(struct crq_queue *queue)
 180{
 181	struct viosrp_crq *crq;
 182	unsigned long flags;
 183
 184	spin_lock_irqsave(&queue->lock, flags);
 185	crq = &queue->msgs[queue->cur];
 186	if (crq->valid != VIOSRP_CRQ_FREE) {
 187		if (++queue->cur == queue->size)
 188			queue->cur = 0;
 189
 190		/* Ensure the read of the valid bit occurs before reading any
 191		 * other bits of the CRQ entry
 192		 */
 193		rmb();
 194	} else
 195		crq = NULL;
 196	spin_unlock_irqrestore(&queue->lock, flags);
 197
 198	return crq;
 199}
 200
 201/**
 202 * ibmvscsi_send_crq: - Send a CRQ
 203 * @hostdata:	the adapter
 204 * @word1:	the first 64 bits of the data
 205 * @word2:	the second 64 bits of the data
 206 */
 207static int ibmvscsi_send_crq(struct ibmvscsi_host_data *hostdata,
 208			     u64 word1, u64 word2)
 209{
 210	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 211
 212	/*
 213	 * Ensure the command buffer is flushed to memory before handing it
 214	 * over to the VIOS to prevent it from fetching any stale data.
 215	 */
 216	mb();
 217	return plpar_hcall_norets(H_SEND_CRQ, vdev->unit_address, word1, word2);
 218}
 219
 220/**
 221 * ibmvscsi_task: - Process srps asynchronously
 222 * @data:	ibmvscsi_host_data of host
 223 */
 224static void ibmvscsi_task(void *data)
 225{
 226	struct ibmvscsi_host_data *hostdata = (struct ibmvscsi_host_data *)data;
 227	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 228	struct viosrp_crq *crq;
 229	int done = 0;
 230
 231	while (!done) {
 232		/* Pull all the valid messages off the CRQ */
 233		while ((crq = crq_queue_next_crq(&hostdata->queue)) != NULL) {
 234			ibmvscsi_handle_crq(crq, hostdata);
 235			crq->valid = VIOSRP_CRQ_FREE;
 236			wmb();
 237		}
 238
 239		vio_enable_interrupts(vdev);
 240		crq = crq_queue_next_crq(&hostdata->queue);
 241		if (crq != NULL) {
 242			vio_disable_interrupts(vdev);
 243			ibmvscsi_handle_crq(crq, hostdata);
 244			crq->valid = VIOSRP_CRQ_FREE;
 245			wmb();
 246		} else {
 247			done = 1;
 248		}
 249	}
 250}
 251
 252static void gather_partition_info(void)
 253{
 254	const char *ppartition_name;
 255	const __be32 *p_number_ptr;
 256
 257	/* Retrieve information about this partition */
 258	if (!of_root)
 259		return;
 260
 261	of_node_get(of_root);
 262
 263	ppartition_name = of_get_property(of_root, "ibm,partition-name", NULL);
 264	if (ppartition_name)
 265		strncpy(partition_name, ppartition_name,
 266				sizeof(partition_name));
 267	p_number_ptr = of_get_property(of_root, "ibm,partition-no", NULL);
 268	if (p_number_ptr)
 269		partition_number = of_read_number(p_number_ptr, 1);
 270	of_node_put(of_root);
 271}
 272
 273static void set_adapter_info(struct ibmvscsi_host_data *hostdata)
 274{
 275	memset(&hostdata->madapter_info, 0x00,
 276			sizeof(hostdata->madapter_info));
 277
 278	dev_info(hostdata->dev, "SRP_VERSION: %s\n", SRP_VERSION);
 279	strcpy(hostdata->madapter_info.srp_version, SRP_VERSION);
 280
 281	strncpy(hostdata->madapter_info.partition_name, partition_name,
 282			sizeof(hostdata->madapter_info.partition_name));
 283
 284	hostdata->madapter_info.partition_number =
 285					cpu_to_be32(partition_number);
 286
 287	hostdata->madapter_info.mad_version = cpu_to_be32(SRP_MAD_VERSION_1);
 288	hostdata->madapter_info.os_type = cpu_to_be32(SRP_MAD_OS_LINUX);
 289}
 290
 291/**
 292 * reset_crq_queue: - resets a crq after a failure
 293 * @queue:	crq_queue to initialize and register
 294 * @hostdata:	ibmvscsi_host_data of host
 295 *
 296 */
 297static int ibmvscsi_reset_crq_queue(struct crq_queue *queue,
 298				    struct ibmvscsi_host_data *hostdata)
 299{
 300	int rc = 0;
 301	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 302
 303	/* Close the CRQ */
 304	do {
 305		if (rc)
 306			msleep(100);
 307		rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 308	} while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 309
 310	/* Clean out the queue */
 311	memset(queue->msgs, 0x00, PAGE_SIZE);
 312	queue->cur = 0;
 313
 314	set_adapter_info(hostdata);
 315
 316	/* And re-open it again */
 317	rc = plpar_hcall_norets(H_REG_CRQ,
 318				vdev->unit_address,
 319				queue->msg_token, PAGE_SIZE);
 320	if (rc == H_CLOSED) {
 321		/* Adapter is good, but other end is not ready */
 322		dev_warn(hostdata->dev, "Partner adapter not ready\n");
 323	} else if (rc != 0) {
 324		dev_warn(hostdata->dev, "couldn't register crq--rc 0x%x\n", rc);
 325	}
 326	return rc;
 327}
 328
 329/**
 330 * initialize_crq_queue: - Initializes and registers CRQ with hypervisor
 331 * @queue:	crq_queue to initialize and register
 332 * @hostdata:	ibmvscsi_host_data of host
 333 *
 334 * Allocates a page for messages, maps it for dma, and registers
 335 * the crq with the hypervisor.
 336 * Returns zero on success.
 337 */
 338static int ibmvscsi_init_crq_queue(struct crq_queue *queue,
 339				   struct ibmvscsi_host_data *hostdata,
 340				   int max_requests)
 341{
 342	int rc;
 343	int retrc;
 344	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 345
 346	queue->msgs = (struct viosrp_crq *)get_zeroed_page(GFP_KERNEL);
 347
 348	if (!queue->msgs)
 349		goto malloc_failed;
 350	queue->size = PAGE_SIZE / sizeof(*queue->msgs);
 351
 352	queue->msg_token = dma_map_single(hostdata->dev, queue->msgs,
 353					  queue->size * sizeof(*queue->msgs),
 354					  DMA_BIDIRECTIONAL);
 355
 356	if (dma_mapping_error(hostdata->dev, queue->msg_token))
 357		goto map_failed;
 358
 359	gather_partition_info();
 360	set_adapter_info(hostdata);
 361
 362	retrc = rc = plpar_hcall_norets(H_REG_CRQ,
 363				vdev->unit_address,
 364				queue->msg_token, PAGE_SIZE);
 365	if (rc == H_RESOURCE)
 366		/* maybe kexecing and resource is busy. try a reset */
 367		rc = ibmvscsi_reset_crq_queue(queue,
 368					      hostdata);
 369
 370	if (rc == H_CLOSED) {
 371		/* Adapter is good, but other end is not ready */
 372		dev_warn(hostdata->dev, "Partner adapter not ready\n");
 373		retrc = 0;
 374	} else if (rc != 0) {
 375		dev_warn(hostdata->dev, "Error %d opening adapter\n", rc);
 376		goto reg_crq_failed;
 377	}
 378
 379	queue->cur = 0;
 380	spin_lock_init(&queue->lock);
 381
 382	tasklet_init(&hostdata->srp_task, (void *)ibmvscsi_task,
 383		     (unsigned long)hostdata);
 384
 385	if (request_irq(vdev->irq,
 386			ibmvscsi_handle_event,
 387			0, "ibmvscsi", (void *)hostdata) != 0) {
 388		dev_err(hostdata->dev, "couldn't register irq 0x%x\n",
 389			vdev->irq);
 390		goto req_irq_failed;
 391	}
 392
 393	rc = vio_enable_interrupts(vdev);
 394	if (rc != 0) {
 395		dev_err(hostdata->dev, "Error %d enabling interrupts!!!\n", rc);
 396		goto req_irq_failed;
 397	}
 398
 399	return retrc;
 400
 401      req_irq_failed:
 402	tasklet_kill(&hostdata->srp_task);
 403	rc = 0;
 404	do {
 405		if (rc)
 406			msleep(100);
 407		rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
 408	} while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 409      reg_crq_failed:
 410	dma_unmap_single(hostdata->dev,
 411			 queue->msg_token,
 412			 queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
 413      map_failed:
 414	free_page((unsigned long)queue->msgs);
 415      malloc_failed:
 416	return -1;
 417}
 418
 419/**
 420 * reenable_crq_queue: - reenables a crq after
 421 * @queue:	crq_queue to initialize and register
 422 * @hostdata:	ibmvscsi_host_data of host
 423 *
 424 */
 425static int ibmvscsi_reenable_crq_queue(struct crq_queue *queue,
 426				       struct ibmvscsi_host_data *hostdata)
 427{
 428	int rc = 0;
 429	struct vio_dev *vdev = to_vio_dev(hostdata->dev);
 430
 431	/* Re-enable the CRQ */
 432	do {
 433		if (rc)
 434			msleep(100);
 435		rc = plpar_hcall_norets(H_ENABLE_CRQ, vdev->unit_address);
 436	} while ((rc == H_IN_PROGRESS) || (rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
 437
 438	if (rc)
 439		dev_err(hostdata->dev, "Error %d enabling adapter\n", rc);
 440	return rc;
 441}
 442
 443/* ------------------------------------------------------------
 444 * Routines for the event pool and event structs
 445 */
 446/**
 447 * initialize_event_pool: - Allocates and initializes the event pool for a host
 448 * @pool:	event_pool to be initialized
 449 * @size:	Number of events in pool
 450 * @hostdata:	ibmvscsi_host_data who owns the event pool
 451 *
 452 * Returns zero on success.
 453*/
 454static int initialize_event_pool(struct event_pool *pool,
 455				 int size, struct ibmvscsi_host_data *hostdata)
 456{
 457	int i;
 458
 459	pool->size = size;
 460	pool->next = 0;
 461	pool->events = kcalloc(pool->size, sizeof(*pool->events), GFP_KERNEL);
 462	if (!pool->events)
 463		return -ENOMEM;
 464
 465	pool->iu_storage =
 466	    dma_alloc_coherent(hostdata->dev,
 467			       pool->size * sizeof(*pool->iu_storage),
 468			       &pool->iu_token, 0);
 469	if (!pool->iu_storage) {
 470		kfree(pool->events);
 471		return -ENOMEM;
 472	}
 473
 474	for (i = 0; i < pool->size; ++i) {
 475		struct srp_event_struct *evt = &pool->events[i];
 476		memset(&evt->crq, 0x00, sizeof(evt->crq));
 477		atomic_set(&evt->free, 1);
 478		evt->crq.valid = VIOSRP_CRQ_CMD_RSP;
 479		evt->crq.IU_length = cpu_to_be16(sizeof(*evt->xfer_iu));
 480		evt->crq.IU_data_ptr = cpu_to_be64(pool->iu_token +
 481			sizeof(*evt->xfer_iu) * i);
 482		evt->xfer_iu = pool->iu_storage + i;
 483		evt->hostdata = hostdata;
 484		evt->ext_list = NULL;
 485		evt->ext_list_token = 0;
 486	}
 487
 488	return 0;
 489}
 490
 491/**
 492 * release_event_pool: - Frees memory of an event pool of a host
 493 * @pool:	event_pool to be released
 494 * @hostdata:	ibmvscsi_host_data who owns the even pool
 495 *
 496 * Returns zero on success.
 497*/
 498static void release_event_pool(struct event_pool *pool,
 499			       struct ibmvscsi_host_data *hostdata)
 500{
 501	int i, in_use = 0;
 502	for (i = 0; i < pool->size; ++i) {
 503		if (atomic_read(&pool->events[i].free) != 1)
 504			++in_use;
 505		if (pool->events[i].ext_list) {
 506			dma_free_coherent(hostdata->dev,
 507				  SG_ALL * sizeof(struct srp_direct_buf),
 508				  pool->events[i].ext_list,
 509				  pool->events[i].ext_list_token);
 510		}
 511	}
 512	if (in_use)
 513		dev_warn(hostdata->dev, "releasing event pool with %d "
 514			 "events still in use?\n", in_use);
 515	kfree(pool->events);
 516	dma_free_coherent(hostdata->dev,
 517			  pool->size * sizeof(*pool->iu_storage),
 518			  pool->iu_storage, pool->iu_token);
 519}
 520
 521/**
 522 * valid_event_struct: - Determines if event is valid.
 523 * @pool:	event_pool that contains the event
 524 * @evt:	srp_event_struct to be checked for validity
 525 *
 526 * Returns zero if event is invalid, one otherwise.
 527*/
 528static int valid_event_struct(struct event_pool *pool,
 529				struct srp_event_struct *evt)
 530{
 531	int index = evt - pool->events;
 532	if (index < 0 || index >= pool->size)	/* outside of bounds */
 533		return 0;
 534	if (evt != pool->events + index)	/* unaligned */
 535		return 0;
 536	return 1;
 537}
 538
 539/**
 540 * ibmvscsi_free-event_struct: - Changes status of event to "free"
 541 * @pool:	event_pool that contains the event
 542 * @evt:	srp_event_struct to be modified
 543 *
 544*/
 545static void free_event_struct(struct event_pool *pool,
 546				       struct srp_event_struct *evt)
 547{
 548	if (!valid_event_struct(pool, evt)) {
 549		dev_err(evt->hostdata->dev, "Freeing invalid event_struct %p "
 550			"(not in pool %p)\n", evt, pool->events);
 551		return;
 552	}
 553	if (atomic_inc_return(&evt->free) != 1) {
 554		dev_err(evt->hostdata->dev, "Freeing event_struct %p "
 555			"which is not in use!\n", evt);
 556		return;
 557	}
 558}
 559
 560/**
 561 * get_evt_struct: - Gets the next free event in pool
 562 * @pool:	event_pool that contains the events to be searched
 563 *
 564 * Returns the next event in "free" state, and NULL if none are free.
 565 * Note that no synchronization is done here, we assume the host_lock
 566 * will syncrhonze things.
 567*/
 568static struct srp_event_struct *get_event_struct(struct event_pool *pool)
 569{
 570	int i;
 571	int poolsize = pool->size;
 572	int offset = pool->next;
 573
 574	for (i = 0; i < poolsize; i++) {
 575		offset = (offset + 1) % poolsize;
 576		if (!atomic_dec_if_positive(&pool->events[offset].free)) {
 577			pool->next = offset;
 578			return &pool->events[offset];
 579		}
 580	}
 581
 582	printk(KERN_ERR "ibmvscsi: found no event struct in pool!\n");
 583	return NULL;
 584}
 585
 586/**
 587 * init_event_struct: Initialize fields in an event struct that are always 
 588 *                    required.
 589 * @evt:        The event
 590 * @done:       Routine to call when the event is responded to
 591 * @format:     SRP or MAD format
 592 * @timeout:    timeout value set in the CRQ
 593 */
 594static void init_event_struct(struct srp_event_struct *evt_struct,
 595			      void (*done) (struct srp_event_struct *),
 596			      u8 format,
 597			      int timeout)
 598{
 599	evt_struct->cmnd = NULL;
 600	evt_struct->cmnd_done = NULL;
 601	evt_struct->sync_srp = NULL;
 602	evt_struct->crq.format = format;
 603	evt_struct->crq.timeout = cpu_to_be16(timeout);
 604	evt_struct->done = done;
 605}
 606
 607/* ------------------------------------------------------------
 608 * Routines for receiving SCSI responses from the hosting partition
 609 */
 610
 611/**
 612 * set_srp_direction: Set the fields in the srp related to data
 613 *     direction and number of buffers based on the direction in
 614 *     the scsi_cmnd and the number of buffers
 615 */
 616static void set_srp_direction(struct scsi_cmnd *cmd,
 617			      struct srp_cmd *srp_cmd, 
 618			      int numbuf)
 619{
 620	u8 fmt;
 621
 622	if (numbuf == 0)
 623		return;
 624	
 625	if (numbuf == 1)
 626		fmt = SRP_DATA_DESC_DIRECT;
 627	else {
 628		fmt = SRP_DATA_DESC_INDIRECT;
 629		numbuf = min(numbuf, MAX_INDIRECT_BUFS);
 630
 631		if (cmd->sc_data_direction == DMA_TO_DEVICE)
 632			srp_cmd->data_out_desc_cnt = numbuf;
 633		else
 634			srp_cmd->data_in_desc_cnt = numbuf;
 635	}
 636
 637	if (cmd->sc_data_direction == DMA_TO_DEVICE)
 638		srp_cmd->buf_fmt = fmt << 4;
 639	else
 640		srp_cmd->buf_fmt = fmt;
 641}
 642
 643/**
 644 * unmap_cmd_data: - Unmap data pointed in srp_cmd based on the format
 645 * @cmd:	srp_cmd whose additional_data member will be unmapped
 646 * @dev:	device for which the memory is mapped
 647 *
 648*/
 649static void unmap_cmd_data(struct srp_cmd *cmd,
 650			   struct srp_event_struct *evt_struct,
 651			   struct device *dev)
 652{
 653	u8 out_fmt, in_fmt;
 654
 655	out_fmt = cmd->buf_fmt >> 4;
 656	in_fmt = cmd->buf_fmt & ((1U << 4) - 1);
 657
 658	if (out_fmt == SRP_NO_DATA_DESC && in_fmt == SRP_NO_DATA_DESC)
 659		return;
 660
 661	if (evt_struct->cmnd)
 662		scsi_dma_unmap(evt_struct->cmnd);
 663}
 664
 665static int map_sg_list(struct scsi_cmnd *cmd, int nseg,
 666		       struct srp_direct_buf *md)
 667{
 668	int i;
 669	struct scatterlist *sg;
 670	u64 total_length = 0;
 671
 672	scsi_for_each_sg(cmd, sg, nseg, i) {
 673		struct srp_direct_buf *descr = md + i;
 674		descr->va = cpu_to_be64(sg_dma_address(sg));
 675		descr->len = cpu_to_be32(sg_dma_len(sg));
 676		descr->key = 0;
 677		total_length += sg_dma_len(sg);
 678 	}
 679	return total_length;
 680}
 681
 682/**
 683 * map_sg_data: - Maps dma for a scatterlist and initializes decriptor fields
 684 * @cmd:	Scsi_Cmnd with the scatterlist
 685 * @srp_cmd:	srp_cmd that contains the memory descriptor
 686 * @dev:	device for which to map dma memory
 687 *
 688 * Called by map_data_for_srp_cmd() when building srp cmd from scsi cmd.
 689 * Returns 1 on success.
 690*/
 691static int map_sg_data(struct scsi_cmnd *cmd,
 692		       struct srp_event_struct *evt_struct,
 693		       struct srp_cmd *srp_cmd, struct device *dev)
 694{
 695
 696	int sg_mapped;
 697	u64 total_length = 0;
 698	struct srp_direct_buf *data =
 699		(struct srp_direct_buf *) srp_cmd->add_data;
 700	struct srp_indirect_buf *indirect =
 701		(struct srp_indirect_buf *) data;
 702
 703	sg_mapped = scsi_dma_map(cmd);
 704	if (!sg_mapped)
 705		return 1;
 706	else if (sg_mapped < 0)
 707		return 0;
 708
 709	set_srp_direction(cmd, srp_cmd, sg_mapped);
 710
 711	/* special case; we can use a single direct descriptor */
 712	if (sg_mapped == 1) {
 713		map_sg_list(cmd, sg_mapped, data);
 714		return 1;
 715	}
 716
 717	indirect->table_desc.va = 0;
 718	indirect->table_desc.len = cpu_to_be32(sg_mapped *
 719					       sizeof(struct srp_direct_buf));
 720	indirect->table_desc.key = 0;
 721
 722	if (sg_mapped <= MAX_INDIRECT_BUFS) {
 723		total_length = map_sg_list(cmd, sg_mapped,
 724					   &indirect->desc_list[0]);
 725		indirect->len = cpu_to_be32(total_length);
 726		return 1;
 727	}
 728
 729	/* get indirect table */
 730	if (!evt_struct->ext_list) {
 731		evt_struct->ext_list = (struct srp_direct_buf *)
 732			dma_alloc_coherent(dev,
 733					   SG_ALL * sizeof(struct srp_direct_buf),
 734					   &evt_struct->ext_list_token, 0);
 735		if (!evt_struct->ext_list) {
 736			if (!firmware_has_feature(FW_FEATURE_CMO))
 737				sdev_printk(KERN_ERR, cmd->device,
 738				            "Can't allocate memory "
 739				            "for indirect table\n");
 740			scsi_dma_unmap(cmd);
 741			return 0;
 742		}
 743	}
 744
 745	total_length = map_sg_list(cmd, sg_mapped, evt_struct->ext_list);
 746
 747	indirect->len = cpu_to_be32(total_length);
 748	indirect->table_desc.va = cpu_to_be64(evt_struct->ext_list_token);
 749	indirect->table_desc.len = cpu_to_be32(sg_mapped *
 750					       sizeof(indirect->desc_list[0]));
 751	memcpy(indirect->desc_list, evt_struct->ext_list,
 752	       MAX_INDIRECT_BUFS * sizeof(struct srp_direct_buf));
 753 	return 1;
 754}
 755
 756/**
 757 * map_data_for_srp_cmd: - Calls functions to map data for srp cmds
 758 * @cmd:	struct scsi_cmnd with the memory to be mapped
 759 * @srp_cmd:	srp_cmd that contains the memory descriptor
 760 * @dev:	dma device for which to map dma memory
 761 *
 762 * Called by scsi_cmd_to_srp_cmd() when converting scsi cmds to srp cmds 
 763 * Returns 1 on success.
 764*/
 765static int map_data_for_srp_cmd(struct scsi_cmnd *cmd,
 766				struct srp_event_struct *evt_struct,
 767				struct srp_cmd *srp_cmd, struct device *dev)
 768{
 769	switch (cmd->sc_data_direction) {
 770	case DMA_FROM_DEVICE:
 771	case DMA_TO_DEVICE:
 772		break;
 773	case DMA_NONE:
 774		return 1;
 775	case DMA_BIDIRECTIONAL:
 776		sdev_printk(KERN_ERR, cmd->device,
 777			    "Can't map DMA_BIDIRECTIONAL to read/write\n");
 778		return 0;
 779	default:
 780		sdev_printk(KERN_ERR, cmd->device,
 781			    "Unknown data direction 0x%02x; can't map!\n",
 782			    cmd->sc_data_direction);
 783		return 0;
 784	}
 785
 786	return map_sg_data(cmd, evt_struct, srp_cmd, dev);
 787}
 788
 789/**
 790 * purge_requests: Our virtual adapter just shut down.  purge any sent requests
 791 * @hostdata:    the adapter
 792 */
 793static void purge_requests(struct ibmvscsi_host_data *hostdata, int error_code)
 794{
 795	struct srp_event_struct *evt;
 796	unsigned long flags;
 797
 798	spin_lock_irqsave(hostdata->host->host_lock, flags);
 799	while (!list_empty(&hostdata->sent)) {
 800		evt = list_first_entry(&hostdata->sent, struct srp_event_struct, list);
 801		list_del(&evt->list);
 802		del_timer(&evt->timer);
 803
 804		spin_unlock_irqrestore(hostdata->host->host_lock, flags);
 805		if (evt->cmnd) {
 806			evt->cmnd->result = (error_code << 16);
 807			unmap_cmd_data(&evt->iu.srp.cmd, evt,
 808				       evt->hostdata->dev);
 809			if (evt->cmnd_done)
 810				evt->cmnd_done(evt->cmnd);
 811		} else if (evt->done && evt->crq.format != VIOSRP_MAD_FORMAT &&
 812			   evt->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
 813			evt->done(evt);
 814		free_event_struct(&evt->hostdata->pool, evt);
 815		spin_lock_irqsave(hostdata->host->host_lock, flags);
 816	}
 817	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
 818}
 819
 820/**
 821 * ibmvscsi_reset_host - Reset the connection to the server
 822 * @hostdata:	struct ibmvscsi_host_data to reset
 823*/
 824static void ibmvscsi_reset_host(struct ibmvscsi_host_data *hostdata)
 825{
 826	scsi_block_requests(hostdata->host);
 827	atomic_set(&hostdata->request_limit, 0);
 828
 829	purge_requests(hostdata, DID_ERROR);
 830	hostdata->reset_crq = 1;
 831	wake_up(&hostdata->work_wait_q);
 832}
 833
 834/**
 835 * ibmvscsi_timeout - Internal command timeout handler
 836 * @evt_struct:	struct srp_event_struct that timed out
 837 *
 838 * Called when an internally generated command times out
 839*/
 840static void ibmvscsi_timeout(struct timer_list *t)
 841{
 842	struct srp_event_struct *evt_struct = from_timer(evt_struct, t, timer);
 843	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
 844
 845	dev_err(hostdata->dev, "Command timed out (%x). Resetting connection\n",
 846		evt_struct->iu.srp.cmd.opcode);
 847
 848	ibmvscsi_reset_host(hostdata);
 849}
 850
 851
 852/* ------------------------------------------------------------
 853 * Routines for sending and receiving SRPs
 854 */
 855/**
 856 * ibmvscsi_send_srp_event: - Transforms event to u64 array and calls send_crq()
 857 * @evt_struct:	evt_struct to be sent
 858 * @hostdata:	ibmvscsi_host_data of host
 859 * @timeout:	timeout in seconds - 0 means do not time command
 860 *
 861 * Returns the value returned from ibmvscsi_send_crq(). (Zero for success)
 862 * Note that this routine assumes that host_lock is held for synchronization
 863*/
 864static int ibmvscsi_send_srp_event(struct srp_event_struct *evt_struct,
 865				   struct ibmvscsi_host_data *hostdata,
 866				   unsigned long timeout)
 867{
 868	__be64 *crq_as_u64 = (__be64 *)&evt_struct->crq;
 869	int request_status = 0;
 870	int rc;
 871	int srp_req = 0;
 872
 873	/* If we have exhausted our request limit, just fail this request,
 874	 * unless it is for a reset or abort.
 875	 * Note that there are rare cases involving driver generated requests 
 876	 * (such as task management requests) that the mid layer may think we
 877	 * can handle more requests (can_queue) when we actually can't
 878	 */
 879	if (evt_struct->crq.format == VIOSRP_SRP_FORMAT) {
 880		srp_req = 1;
 881		request_status =
 882			atomic_dec_if_positive(&hostdata->request_limit);
 883		/* If request limit was -1 when we started, it is now even
 884		 * less than that
 885		 */
 886		if (request_status < -1)
 887			goto send_error;
 888		/* Otherwise, we may have run out of requests. */
 889		/* If request limit was 0 when we started the adapter is in the
 890		 * process of performing a login with the server adapter, or
 891		 * we may have run out of requests.
 892		 */
 893		else if (request_status == -1 &&
 894		         evt_struct->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
 895			goto send_busy;
 896		/* Abort and reset calls should make it through.
 897		 * Nothing except abort and reset should use the last two
 898		 * slots unless we had two or less to begin with.
 899		 */
 900		else if (request_status < 2 &&
 901		         evt_struct->iu.srp.cmd.opcode != SRP_TSK_MGMT) {
 902			/* In the case that we have less than two requests
 903			 * available, check the server limit as a combination
 904			 * of the request limit and the number of requests
 905			 * in-flight (the size of the send list).  If the
 906			 * server limit is greater than 2, return busy so
 907			 * that the last two are reserved for reset and abort.
 908			 */
 909			int server_limit = request_status;
 910			struct srp_event_struct *tmp_evt;
 911
 912			list_for_each_entry(tmp_evt, &hostdata->sent, list) {
 913				server_limit++;
 914			}
 915
 916			if (server_limit > 2)
 917				goto send_busy;
 918		}
 919	}
 920
 921	/* Copy the IU into the transfer area */
 922	*evt_struct->xfer_iu = evt_struct->iu;
 923	evt_struct->xfer_iu->srp.rsp.tag = (u64)evt_struct;
 924
 925	/* Add this to the sent list.  We need to do this 
 926	 * before we actually send 
 927	 * in case it comes back REALLY fast
 928	 */
 929	list_add_tail(&evt_struct->list, &hostdata->sent);
 930
 931	timer_setup(&evt_struct->timer, ibmvscsi_timeout, 0);
 932	if (timeout) {
 
 933		evt_struct->timer.expires = jiffies + (timeout * HZ);
 
 934		add_timer(&evt_struct->timer);
 935	}
 936
 937	rc = ibmvscsi_send_crq(hostdata, be64_to_cpu(crq_as_u64[0]),
 938			       be64_to_cpu(crq_as_u64[1]));
 939	if (rc != 0) {
 940		list_del(&evt_struct->list);
 941		del_timer(&evt_struct->timer);
 942
 943		/* If send_crq returns H_CLOSED, return SCSI_MLQUEUE_HOST_BUSY.
 944		 * Firmware will send a CRQ with a transport event (0xFF) to
 945		 * tell this client what has happened to the transport.  This
 946		 * will be handled in ibmvscsi_handle_crq()
 947		 */
 948		if (rc == H_CLOSED) {
 949			dev_warn(hostdata->dev, "send warning. "
 950			         "Receive queue closed, will retry.\n");
 951			goto send_busy;
 952		}
 953		dev_err(hostdata->dev, "send error %d\n", rc);
 954		if (srp_req)
 955			atomic_inc(&hostdata->request_limit);
 956		goto send_error;
 957	}
 958
 959	return 0;
 960
 961 send_busy:
 962	unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
 963
 964	free_event_struct(&hostdata->pool, evt_struct);
 965	if (srp_req && request_status != -1)
 966		atomic_inc(&hostdata->request_limit);
 967	return SCSI_MLQUEUE_HOST_BUSY;
 968
 969 send_error:
 970	unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
 971
 972	if (evt_struct->cmnd != NULL) {
 973		evt_struct->cmnd->result = DID_ERROR << 16;
 974		evt_struct->cmnd_done(evt_struct->cmnd);
 975	} else if (evt_struct->done)
 976		evt_struct->done(evt_struct);
 977
 978	free_event_struct(&hostdata->pool, evt_struct);
 979	return 0;
 980}
 981
 982/**
 983 * handle_cmd_rsp: -  Handle responses from commands
 984 * @evt_struct:	srp_event_struct to be handled
 985 *
 986 * Used as a callback by when sending scsi cmds.
 987 * Gets called by ibmvscsi_handle_crq()
 988*/
 989static void handle_cmd_rsp(struct srp_event_struct *evt_struct)
 990{
 991	struct srp_rsp *rsp = &evt_struct->xfer_iu->srp.rsp;
 992	struct scsi_cmnd *cmnd = evt_struct->cmnd;
 993
 994	if (unlikely(rsp->opcode != SRP_RSP)) {
 995		if (printk_ratelimit())
 996			dev_warn(evt_struct->hostdata->dev,
 997				 "bad SRP RSP type %#02x\n", rsp->opcode);
 998	}
 999	
1000	if (cmnd) {
1001		cmnd->result |= rsp->status;
1002		if (((cmnd->result >> 1) & 0x1f) == CHECK_CONDITION)
1003			memcpy(cmnd->sense_buffer,
1004			       rsp->data,
1005			       be32_to_cpu(rsp->sense_data_len));
1006		unmap_cmd_data(&evt_struct->iu.srp.cmd, 
1007			       evt_struct, 
1008			       evt_struct->hostdata->dev);
1009
1010		if (rsp->flags & SRP_RSP_FLAG_DOOVER)
1011			scsi_set_resid(cmnd,
1012				       be32_to_cpu(rsp->data_out_res_cnt));
1013		else if (rsp->flags & SRP_RSP_FLAG_DIOVER)
1014			scsi_set_resid(cmnd, be32_to_cpu(rsp->data_in_res_cnt));
1015	}
1016
1017	if (evt_struct->cmnd_done)
1018		evt_struct->cmnd_done(cmnd);
1019}
1020
1021/**
1022 * lun_from_dev: - Returns the lun of the scsi device
1023 * @dev:	struct scsi_device
1024 *
1025*/
1026static inline u16 lun_from_dev(struct scsi_device *dev)
1027{
1028	return (0x2 << 14) | (dev->id << 8) | (dev->channel << 5) | dev->lun;
1029}
1030
1031/**
1032 * ibmvscsi_queue: - The queuecommand function of the scsi template 
1033 * @cmd:	struct scsi_cmnd to be executed
1034 * @done:	Callback function to be called when cmd is completed
1035*/
1036static int ibmvscsi_queuecommand_lck(struct scsi_cmnd *cmnd,
1037				 void (*done) (struct scsi_cmnd *))
1038{
1039	struct srp_cmd *srp_cmd;
1040	struct srp_event_struct *evt_struct;
1041	struct srp_indirect_buf *indirect;
1042	struct ibmvscsi_host_data *hostdata = shost_priv(cmnd->device->host);
1043	u16 lun = lun_from_dev(cmnd->device);
1044	u8 out_fmt, in_fmt;
1045
1046	cmnd->result = (DID_OK << 16);
1047	evt_struct = get_event_struct(&hostdata->pool);
1048	if (!evt_struct)
1049		return SCSI_MLQUEUE_HOST_BUSY;
1050
1051	/* Set up the actual SRP IU */
1052	srp_cmd = &evt_struct->iu.srp.cmd;
1053	memset(srp_cmd, 0x00, SRP_MAX_IU_LEN);
1054	srp_cmd->opcode = SRP_CMD;
1055	memcpy(srp_cmd->cdb, cmnd->cmnd, sizeof(srp_cmd->cdb));
1056	int_to_scsilun(lun, &srp_cmd->lun);
1057
1058	if (!map_data_for_srp_cmd(cmnd, evt_struct, srp_cmd, hostdata->dev)) {
1059		if (!firmware_has_feature(FW_FEATURE_CMO))
1060			sdev_printk(KERN_ERR, cmnd->device,
1061			            "couldn't convert cmd to srp_cmd\n");
1062		free_event_struct(&hostdata->pool, evt_struct);
1063		return SCSI_MLQUEUE_HOST_BUSY;
1064	}
1065
1066	init_event_struct(evt_struct,
1067			  handle_cmd_rsp,
1068			  VIOSRP_SRP_FORMAT,
1069			  cmnd->request->timeout/HZ);
1070
1071	evt_struct->cmnd = cmnd;
1072	evt_struct->cmnd_done = done;
1073
1074	/* Fix up dma address of the buffer itself */
1075	indirect = (struct srp_indirect_buf *) srp_cmd->add_data;
1076	out_fmt = srp_cmd->buf_fmt >> 4;
1077	in_fmt = srp_cmd->buf_fmt & ((1U << 4) - 1);
1078	if ((in_fmt == SRP_DATA_DESC_INDIRECT ||
1079	     out_fmt == SRP_DATA_DESC_INDIRECT) &&
1080	    indirect->table_desc.va == 0) {
1081		indirect->table_desc.va =
1082			cpu_to_be64(be64_to_cpu(evt_struct->crq.IU_data_ptr) +
1083			offsetof(struct srp_cmd, add_data) +
1084			offsetof(struct srp_indirect_buf, desc_list));
1085	}
1086
1087	return ibmvscsi_send_srp_event(evt_struct, hostdata, 0);
1088}
1089
1090static DEF_SCSI_QCMD(ibmvscsi_queuecommand)
1091
1092/* ------------------------------------------------------------
1093 * Routines for driver initialization
1094 */
1095
1096/**
1097 * map_persist_bufs: - Pre-map persistent data for adapter logins
1098 * @hostdata:   ibmvscsi_host_data of host
1099 *
1100 * Map the capabilities and adapter info DMA buffers to avoid runtime failures.
1101 * Return 1 on error, 0 on success.
1102 */
1103static int map_persist_bufs(struct ibmvscsi_host_data *hostdata)
1104{
1105
1106	hostdata->caps_addr = dma_map_single(hostdata->dev, &hostdata->caps,
1107					     sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1108
1109	if (dma_mapping_error(hostdata->dev, hostdata->caps_addr)) {
1110		dev_err(hostdata->dev, "Unable to map capabilities buffer!\n");
1111		return 1;
1112	}
1113
1114	hostdata->adapter_info_addr = dma_map_single(hostdata->dev,
1115						     &hostdata->madapter_info,
1116						     sizeof(hostdata->madapter_info),
1117						     DMA_BIDIRECTIONAL);
1118	if (dma_mapping_error(hostdata->dev, hostdata->adapter_info_addr)) {
1119		dev_err(hostdata->dev, "Unable to map adapter info buffer!\n");
1120		dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1121				 sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1122		return 1;
1123	}
1124
1125	return 0;
1126}
1127
1128/**
1129 * unmap_persist_bufs: - Unmap persistent data needed for adapter logins
1130 * @hostdata:   ibmvscsi_host_data of host
1131 *
1132 * Unmap the capabilities and adapter info DMA buffers
1133 */
1134static void unmap_persist_bufs(struct ibmvscsi_host_data *hostdata)
1135{
1136	dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1137			 sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1138
1139	dma_unmap_single(hostdata->dev, hostdata->adapter_info_addr,
1140			 sizeof(hostdata->madapter_info), DMA_BIDIRECTIONAL);
1141}
1142
1143/**
1144 * login_rsp: - Handle response to SRP login request
1145 * @evt_struct:	srp_event_struct with the response
1146 *
1147 * Used as a "done" callback by when sending srp_login. Gets called
1148 * by ibmvscsi_handle_crq()
1149*/
1150static void login_rsp(struct srp_event_struct *evt_struct)
1151{
1152	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1153	switch (evt_struct->xfer_iu->srp.login_rsp.opcode) {
1154	case SRP_LOGIN_RSP:	/* it worked! */
1155		break;
1156	case SRP_LOGIN_REJ:	/* refused! */
1157		dev_info(hostdata->dev, "SRP_LOGIN_REJ reason %u\n",
1158			 evt_struct->xfer_iu->srp.login_rej.reason);
1159		/* Login failed.  */
1160		atomic_set(&hostdata->request_limit, -1);
1161		return;
1162	default:
1163		dev_err(hostdata->dev, "Invalid login response typecode 0x%02x!\n",
1164			evt_struct->xfer_iu->srp.login_rsp.opcode);
1165		/* Login failed.  */
1166		atomic_set(&hostdata->request_limit, -1);
1167		return;
1168	}
1169
1170	dev_info(hostdata->dev, "SRP_LOGIN succeeded\n");
1171	hostdata->client_migrated = 0;
1172
1173	/* Now we know what the real request-limit is.
1174	 * This value is set rather than added to request_limit because
1175	 * request_limit could have been set to -1 by this client.
1176	 */
1177	atomic_set(&hostdata->request_limit,
1178		   be32_to_cpu(evt_struct->xfer_iu->srp.login_rsp.req_lim_delta));
1179
1180	/* If we had any pending I/Os, kick them */
1181	scsi_unblock_requests(hostdata->host);
1182}
1183
1184/**
1185 * send_srp_login: - Sends the srp login
1186 * @hostdata:	ibmvscsi_host_data of host
1187 *
1188 * Returns zero if successful.
1189*/
1190static int send_srp_login(struct ibmvscsi_host_data *hostdata)
1191{
1192	int rc;
1193	unsigned long flags;
1194	struct srp_login_req *login;
1195	struct srp_event_struct *evt_struct = get_event_struct(&hostdata->pool);
1196
1197	BUG_ON(!evt_struct);
1198	init_event_struct(evt_struct, login_rsp,
1199			  VIOSRP_SRP_FORMAT, login_timeout);
1200
1201	login = &evt_struct->iu.srp.login_req;
1202	memset(login, 0, sizeof(*login));
1203	login->opcode = SRP_LOGIN_REQ;
1204	login->req_it_iu_len = cpu_to_be32(sizeof(union srp_iu));
1205	login->req_buf_fmt = cpu_to_be16(SRP_BUF_FORMAT_DIRECT |
1206					 SRP_BUF_FORMAT_INDIRECT);
1207
1208	spin_lock_irqsave(hostdata->host->host_lock, flags);
1209	/* Start out with a request limit of 0, since this is negotiated in
1210	 * the login request we are just sending and login requests always
1211	 * get sent by the driver regardless of request_limit.
1212	 */
1213	atomic_set(&hostdata->request_limit, 0);
1214
1215	rc = ibmvscsi_send_srp_event(evt_struct, hostdata, login_timeout * 2);
1216	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1217	dev_info(hostdata->dev, "sent SRP login\n");
1218	return rc;
1219};
1220
1221/**
1222 * capabilities_rsp: - Handle response to MAD adapter capabilities request
1223 * @evt_struct:	srp_event_struct with the response
1224 *
1225 * Used as a "done" callback by when sending adapter_info.
1226 */
1227static void capabilities_rsp(struct srp_event_struct *evt_struct)
1228{
1229	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1230
1231	if (evt_struct->xfer_iu->mad.capabilities.common.status) {
1232		dev_err(hostdata->dev, "error 0x%X getting capabilities info\n",
1233			evt_struct->xfer_iu->mad.capabilities.common.status);
1234	} else {
1235		if (hostdata->caps.migration.common.server_support !=
1236		    cpu_to_be16(SERVER_SUPPORTS_CAP))
1237			dev_info(hostdata->dev, "Partition migration not supported\n");
1238
1239		if (client_reserve) {
1240			if (hostdata->caps.reserve.common.server_support ==
1241			    cpu_to_be16(SERVER_SUPPORTS_CAP))
1242				dev_info(hostdata->dev, "Client reserve enabled\n");
1243			else
1244				dev_info(hostdata->dev, "Client reserve not supported\n");
1245		}
1246	}
1247
1248	send_srp_login(hostdata);
1249}
1250
1251/**
1252 * send_mad_capabilities: - Sends the mad capabilities request
1253 *      and stores the result so it can be retrieved with
1254 * @hostdata:	ibmvscsi_host_data of host
1255 */
1256static void send_mad_capabilities(struct ibmvscsi_host_data *hostdata)
1257{
1258	struct viosrp_capabilities *req;
1259	struct srp_event_struct *evt_struct;
1260	unsigned long flags;
1261	struct device_node *of_node = hostdata->dev->of_node;
1262	const char *location;
1263
1264	evt_struct = get_event_struct(&hostdata->pool);
1265	BUG_ON(!evt_struct);
1266
1267	init_event_struct(evt_struct, capabilities_rsp,
1268			  VIOSRP_MAD_FORMAT, info_timeout);
1269
1270	req = &evt_struct->iu.mad.capabilities;
1271	memset(req, 0, sizeof(*req));
1272
1273	hostdata->caps.flags = cpu_to_be32(CAP_LIST_SUPPORTED);
1274	if (hostdata->client_migrated)
1275		hostdata->caps.flags |= cpu_to_be32(CLIENT_MIGRATED);
1276
1277	strncpy(hostdata->caps.name, dev_name(&hostdata->host->shost_gendev),
1278		sizeof(hostdata->caps.name));
1279	hostdata->caps.name[sizeof(hostdata->caps.name) - 1] = '\0';
1280
1281	location = of_get_property(of_node, "ibm,loc-code", NULL);
1282	location = location ? location : dev_name(hostdata->dev);
1283	strncpy(hostdata->caps.loc, location, sizeof(hostdata->caps.loc));
1284	hostdata->caps.loc[sizeof(hostdata->caps.loc) - 1] = '\0';
1285
1286	req->common.type = cpu_to_be32(VIOSRP_CAPABILITIES_TYPE);
1287	req->buffer = cpu_to_be64(hostdata->caps_addr);
1288
1289	hostdata->caps.migration.common.cap_type =
1290				cpu_to_be32(MIGRATION_CAPABILITIES);
1291	hostdata->caps.migration.common.length =
1292				cpu_to_be16(sizeof(hostdata->caps.migration));
1293	hostdata->caps.migration.common.server_support =
1294				cpu_to_be16(SERVER_SUPPORTS_CAP);
1295	hostdata->caps.migration.ecl = cpu_to_be32(1);
1296
1297	if (client_reserve) {
1298		hostdata->caps.reserve.common.cap_type =
1299					cpu_to_be32(RESERVATION_CAPABILITIES);
1300		hostdata->caps.reserve.common.length =
1301				cpu_to_be16(sizeof(hostdata->caps.reserve));
1302		hostdata->caps.reserve.common.server_support =
1303				cpu_to_be16(SERVER_SUPPORTS_CAP);
1304		hostdata->caps.reserve.type =
1305				cpu_to_be32(CLIENT_RESERVE_SCSI_2);
1306		req->common.length =
1307				cpu_to_be16(sizeof(hostdata->caps));
1308	} else
1309		req->common.length = cpu_to_be16(sizeof(hostdata->caps) -
1310						sizeof(hostdata->caps.reserve));
1311
1312	spin_lock_irqsave(hostdata->host->host_lock, flags);
1313	if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1314		dev_err(hostdata->dev, "couldn't send CAPABILITIES_REQ!\n");
1315	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1316};
1317
1318/**
1319 * fast_fail_rsp: - Handle response to MAD enable fast fail
1320 * @evt_struct:	srp_event_struct with the response
1321 *
1322 * Used as a "done" callback by when sending enable fast fail. Gets called
1323 * by ibmvscsi_handle_crq()
1324 */
1325static void fast_fail_rsp(struct srp_event_struct *evt_struct)
1326{
1327	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1328	u16 status = be16_to_cpu(evt_struct->xfer_iu->mad.fast_fail.common.status);
1329
1330	if (status == VIOSRP_MAD_NOT_SUPPORTED)
1331		dev_err(hostdata->dev, "fast_fail not supported in server\n");
1332	else if (status == VIOSRP_MAD_FAILED)
1333		dev_err(hostdata->dev, "fast_fail request failed\n");
1334	else if (status != VIOSRP_MAD_SUCCESS)
1335		dev_err(hostdata->dev, "error 0x%X enabling fast_fail\n", status);
1336
1337	send_mad_capabilities(hostdata);
1338}
1339
1340/**
1341 * init_host - Start host initialization
1342 * @hostdata:	ibmvscsi_host_data of host
1343 *
1344 * Returns zero if successful.
1345 */
1346static int enable_fast_fail(struct ibmvscsi_host_data *hostdata)
1347{
1348	int rc;
1349	unsigned long flags;
1350	struct viosrp_fast_fail *fast_fail_mad;
1351	struct srp_event_struct *evt_struct;
1352
1353	if (!fast_fail) {
1354		send_mad_capabilities(hostdata);
1355		return 0;
1356	}
1357
1358	evt_struct = get_event_struct(&hostdata->pool);
1359	BUG_ON(!evt_struct);
1360
1361	init_event_struct(evt_struct, fast_fail_rsp, VIOSRP_MAD_FORMAT, info_timeout);
1362
1363	fast_fail_mad = &evt_struct->iu.mad.fast_fail;
1364	memset(fast_fail_mad, 0, sizeof(*fast_fail_mad));
1365	fast_fail_mad->common.type = cpu_to_be32(VIOSRP_ENABLE_FAST_FAIL);
1366	fast_fail_mad->common.length = cpu_to_be16(sizeof(*fast_fail_mad));
1367
1368	spin_lock_irqsave(hostdata->host->host_lock, flags);
1369	rc = ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2);
1370	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1371	return rc;
1372}
1373
1374/**
1375 * adapter_info_rsp: - Handle response to MAD adapter info request
1376 * @evt_struct:	srp_event_struct with the response
1377 *
1378 * Used as a "done" callback by when sending adapter_info. Gets called
1379 * by ibmvscsi_handle_crq()
1380*/
1381static void adapter_info_rsp(struct srp_event_struct *evt_struct)
1382{
1383	struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1384
1385	if (evt_struct->xfer_iu->mad.adapter_info.common.status) {
1386		dev_err(hostdata->dev, "error %d getting adapter info\n",
1387			evt_struct->xfer_iu->mad.adapter_info.common.status);
1388	} else {
1389		dev_info(hostdata->dev, "host srp version: %s, "
1390			 "host partition %s (%d), OS %d, max io %u\n",
1391			 hostdata->madapter_info.srp_version,
1392			 hostdata->madapter_info.partition_name,
1393			 be32_to_cpu(hostdata->madapter_info.partition_number),
1394			 be32_to_cpu(hostdata->madapter_info.os_type),
1395			 be32_to_cpu(hostdata->madapter_info.port_max_txu[0]));
1396		
1397		if (hostdata->madapter_info.port_max_txu[0]) 
1398			hostdata->host->max_sectors = 
1399				be32_to_cpu(hostdata->madapter_info.port_max_txu[0]) >> 9;
1400		
1401		if (be32_to_cpu(hostdata->madapter_info.os_type) == SRP_MAD_OS_AIX &&
1402		    strcmp(hostdata->madapter_info.srp_version, "1.6a") <= 0) {
1403			dev_err(hostdata->dev, "host (Ver. %s) doesn't support large transfers\n",
1404				hostdata->madapter_info.srp_version);
1405			dev_err(hostdata->dev, "limiting scatterlists to %d\n",
1406				MAX_INDIRECT_BUFS);
1407			hostdata->host->sg_tablesize = MAX_INDIRECT_BUFS;
1408		}
1409
1410		if (be32_to_cpu(hostdata->madapter_info.os_type) == SRP_MAD_OS_AIX) {
1411			enable_fast_fail(hostdata);
1412			return;
1413		}
1414	}
1415
1416	send_srp_login(hostdata);
1417}
1418
1419/**
1420 * send_mad_adapter_info: - Sends the mad adapter info request
1421 *      and stores the result so it can be retrieved with
1422 *      sysfs.  We COULD consider causing a failure if the
1423 *      returned SRP version doesn't match ours.
1424 * @hostdata:	ibmvscsi_host_data of host
1425 * 
1426 * Returns zero if successful.
1427*/
1428static void send_mad_adapter_info(struct ibmvscsi_host_data *hostdata)
1429{
1430	struct viosrp_adapter_info *req;
1431	struct srp_event_struct *evt_struct;
1432	unsigned long flags;
1433
1434	evt_struct = get_event_struct(&hostdata->pool);
1435	BUG_ON(!evt_struct);
1436
1437	init_event_struct(evt_struct,
1438			  adapter_info_rsp,
1439			  VIOSRP_MAD_FORMAT,
1440			  info_timeout);
1441	
1442	req = &evt_struct->iu.mad.adapter_info;
1443	memset(req, 0x00, sizeof(*req));
1444	
1445	req->common.type = cpu_to_be32(VIOSRP_ADAPTER_INFO_TYPE);
1446	req->common.length = cpu_to_be16(sizeof(hostdata->madapter_info));
1447	req->buffer = cpu_to_be64(hostdata->adapter_info_addr);
1448
1449	spin_lock_irqsave(hostdata->host->host_lock, flags);
1450	if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1451		dev_err(hostdata->dev, "couldn't send ADAPTER_INFO_REQ!\n");
1452	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1453};
1454
/**
 * init_adapter: Start virtual adapter initialization sequence
 * @hostdata:	ibmvscsi_host_data of host
 *
 * The sequence begins with the MAD adapter info request; the later steps
 * are driven from that request's response handler.
 */
static void init_adapter(struct ibmvscsi_host_data *hostdata)
{
	send_mad_adapter_info(hostdata);
}
1463
1464/**
1465 * sync_completion: Signal that a synchronous command has completed
1466 * Note that after returning from this call, the evt_struct is freed.
1467 * the caller waiting on this completion shouldn't touch the evt_struct
1468 * again.
1469 */
1470static void sync_completion(struct srp_event_struct *evt_struct)
1471{
1472	/* copy the response back */
1473	if (evt_struct->sync_srp)
1474		*evt_struct->sync_srp = *evt_struct->xfer_iu;
1475	
1476	complete(&evt_struct->comp);
1477}
1478
1479/**
1480 * ibmvscsi_abort: Abort a command...from scsi host template
1481 * send this over to the server and wait synchronously for the response
1482 */
1483static int ibmvscsi_eh_abort_handler(struct scsi_cmnd *cmd)
1484{
1485	struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1486	struct srp_tsk_mgmt *tsk_mgmt;
1487	struct srp_event_struct *evt;
1488	struct srp_event_struct *tmp_evt, *found_evt;
1489	union viosrp_iu srp_rsp;
1490	int rsp_rc;
1491	unsigned long flags;
1492	u16 lun = lun_from_dev(cmd->device);
1493	unsigned long wait_switch = 0;
1494
1495	/* First, find this command in our sent list so we can figure
1496	 * out the correct tag
1497	 */
1498	spin_lock_irqsave(hostdata->host->host_lock, flags);
1499	wait_switch = jiffies + (init_timeout * HZ);
1500	do {
1501		found_evt = NULL;
1502		list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1503			if (tmp_evt->cmnd == cmd) {
1504				found_evt = tmp_evt;
1505				break;
1506			}
1507		}
1508
1509		if (!found_evt) {
1510			spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1511			return SUCCESS;
1512		}
1513
1514		evt = get_event_struct(&hostdata->pool);
1515		if (evt == NULL) {
1516			spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1517			sdev_printk(KERN_ERR, cmd->device,
1518				"failed to allocate abort event\n");
1519			return FAILED;
1520		}
1521	
1522		init_event_struct(evt,
1523				  sync_completion,
1524				  VIOSRP_SRP_FORMAT,
1525				  abort_timeout);
1526
1527		tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1528	
1529		/* Set up an abort SRP command */
1530		memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1531		tsk_mgmt->opcode = SRP_TSK_MGMT;
1532		int_to_scsilun(lun, &tsk_mgmt->lun);
1533		tsk_mgmt->tsk_mgmt_func = SRP_TSK_ABORT_TASK;
1534		tsk_mgmt->task_tag = (u64) found_evt;
1535
1536		evt->sync_srp = &srp_rsp;
1537
1538		init_completion(&evt->comp);
1539		rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, abort_timeout * 2);
1540
1541		if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1542			break;
1543
1544		spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1545		msleep(10);
1546		spin_lock_irqsave(hostdata->host->host_lock, flags);
1547	} while (time_before(jiffies, wait_switch));
1548
1549	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1550
1551	if (rsp_rc != 0) {
1552		sdev_printk(KERN_ERR, cmd->device,
1553			    "failed to send abort() event. rc=%d\n", rsp_rc);
1554		return FAILED;
1555	}
1556
1557	sdev_printk(KERN_INFO, cmd->device,
1558                    "aborting command. lun 0x%llx, tag 0x%llx\n",
1559		    (((u64) lun) << 48), (u64) found_evt);
1560
1561	wait_for_completion(&evt->comp);
1562
1563	/* make sure we got a good response */
1564	if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1565		if (printk_ratelimit())
1566			sdev_printk(KERN_WARNING, cmd->device, "abort bad SRP RSP type %d\n",
1567				    srp_rsp.srp.rsp.opcode);
1568		return FAILED;
1569	}
1570
1571	if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1572		rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1573	else
1574		rsp_rc = srp_rsp.srp.rsp.status;
1575
1576	if (rsp_rc) {
1577		if (printk_ratelimit())
1578			sdev_printk(KERN_WARNING, cmd->device,
1579				    "abort code %d for task tag 0x%llx\n",
1580				    rsp_rc, tsk_mgmt->task_tag);
1581		return FAILED;
1582	}
1583
1584	/* Because we dropped the spinlock above, it's possible
1585	 * The event is no longer in our list.  Make sure it didn't
1586	 * complete while we were aborting
1587	 */
1588	spin_lock_irqsave(hostdata->host->host_lock, flags);
1589	found_evt = NULL;
1590	list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1591		if (tmp_evt->cmnd == cmd) {
1592			found_evt = tmp_evt;
1593			break;
1594		}
1595	}
1596
1597	if (found_evt == NULL) {
1598		spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1599		sdev_printk(KERN_INFO, cmd->device, "aborted task tag 0x%llx completed\n",
1600			    tsk_mgmt->task_tag);
1601		return SUCCESS;
1602	}
1603
1604	sdev_printk(KERN_INFO, cmd->device, "successfully aborted task tag 0x%llx\n",
1605		    tsk_mgmt->task_tag);
1606
1607	cmd->result = (DID_ABORT << 16);
1608	list_del(&found_evt->list);
1609	unmap_cmd_data(&found_evt->iu.srp.cmd, found_evt,
1610		       found_evt->hostdata->dev);
1611	free_event_struct(&found_evt->hostdata->pool, found_evt);
1612	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1613	atomic_inc(&hostdata->request_limit);
1614	return SUCCESS;
1615}
1616
1617/**
1618 * ibmvscsi_eh_device_reset_handler: Reset a single LUN...from scsi host 
1619 * template send this over to the server and wait synchronously for the 
1620 * response
1621 */
1622static int ibmvscsi_eh_device_reset_handler(struct scsi_cmnd *cmd)
1623{
1624	struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1625	struct srp_tsk_mgmt *tsk_mgmt;
1626	struct srp_event_struct *evt;
1627	struct srp_event_struct *tmp_evt, *pos;
1628	union viosrp_iu srp_rsp;
1629	int rsp_rc;
1630	unsigned long flags;
1631	u16 lun = lun_from_dev(cmd->device);
1632	unsigned long wait_switch = 0;
1633
1634	spin_lock_irqsave(hostdata->host->host_lock, flags);
1635	wait_switch = jiffies + (init_timeout * HZ);
1636	do {
1637		evt = get_event_struct(&hostdata->pool);
1638		if (evt == NULL) {
1639			spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1640			sdev_printk(KERN_ERR, cmd->device,
1641				"failed to allocate reset event\n");
1642			return FAILED;
1643		}
1644	
1645		init_event_struct(evt,
1646				  sync_completion,
1647				  VIOSRP_SRP_FORMAT,
1648				  reset_timeout);
1649
1650		tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1651
1652		/* Set up a lun reset SRP command */
1653		memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1654		tsk_mgmt->opcode = SRP_TSK_MGMT;
1655		int_to_scsilun(lun, &tsk_mgmt->lun);
1656		tsk_mgmt->tsk_mgmt_func = SRP_TSK_LUN_RESET;
1657
1658		evt->sync_srp = &srp_rsp;
1659
1660		init_completion(&evt->comp);
1661		rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, reset_timeout * 2);
1662
1663		if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1664			break;
1665
1666		spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1667		msleep(10);
1668		spin_lock_irqsave(hostdata->host->host_lock, flags);
1669	} while (time_before(jiffies, wait_switch));
1670
1671	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1672
1673	if (rsp_rc != 0) {
1674		sdev_printk(KERN_ERR, cmd->device,
1675			    "failed to send reset event. rc=%d\n", rsp_rc);
1676		return FAILED;
1677	}
1678
1679	sdev_printk(KERN_INFO, cmd->device, "resetting device. lun 0x%llx\n",
1680		    (((u64) lun) << 48));
1681
1682	wait_for_completion(&evt->comp);
1683
1684	/* make sure we got a good response */
1685	if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1686		if (printk_ratelimit())
1687			sdev_printk(KERN_WARNING, cmd->device, "reset bad SRP RSP type %d\n",
1688				    srp_rsp.srp.rsp.opcode);
1689		return FAILED;
1690	}
1691
1692	if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1693		rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1694	else
1695		rsp_rc = srp_rsp.srp.rsp.status;
1696
1697	if (rsp_rc) {
1698		if (printk_ratelimit())
1699			sdev_printk(KERN_WARNING, cmd->device,
1700				    "reset code %d for task tag 0x%llx\n",
1701				    rsp_rc, tsk_mgmt->task_tag);
1702		return FAILED;
1703	}
1704
1705	/* We need to find all commands for this LUN that have not yet been
1706	 * responded to, and fail them with DID_RESET
1707	 */
1708	spin_lock_irqsave(hostdata->host->host_lock, flags);
1709	list_for_each_entry_safe(tmp_evt, pos, &hostdata->sent, list) {
1710		if ((tmp_evt->cmnd) && (tmp_evt->cmnd->device == cmd->device)) {
1711			if (tmp_evt->cmnd)
1712				tmp_evt->cmnd->result = (DID_RESET << 16);
1713			list_del(&tmp_evt->list);
1714			unmap_cmd_data(&tmp_evt->iu.srp.cmd, tmp_evt,
1715				       tmp_evt->hostdata->dev);
1716			free_event_struct(&tmp_evt->hostdata->pool,
1717						   tmp_evt);
1718			atomic_inc(&hostdata->request_limit);
1719			if (tmp_evt->cmnd_done)
1720				tmp_evt->cmnd_done(tmp_evt->cmnd);
1721			else if (tmp_evt->done)
1722				tmp_evt->done(tmp_evt);
1723		}
1724	}
1725	spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1726	return SUCCESS;
1727}
1728
1729/**
1730 * ibmvscsi_eh_host_reset_handler - Reset the connection to the server
1731 * @cmd:	struct scsi_cmnd having problems
1732*/
1733static int ibmvscsi_eh_host_reset_handler(struct scsi_cmnd *cmd)
1734{
1735	unsigned long wait_switch = 0;
1736	struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1737
1738	dev_err(hostdata->dev, "Resetting connection due to error recovery\n");
1739
1740	ibmvscsi_reset_host(hostdata);
1741
1742	for (wait_switch = jiffies + (init_timeout * HZ);
1743	     time_before(jiffies, wait_switch) &&
1744		     atomic_read(&hostdata->request_limit) < 2;) {
1745
1746		msleep(10);
1747	}
1748
1749	if (atomic_read(&hostdata->request_limit) <= 0)
1750		return FAILED;
1751
1752	return SUCCESS;
1753}
1754
/**
 * ibmvscsi_handle_crq: - Handles and frees received events in the CRQ
 * @crq:	CRQ entry to process; its valid, format, status and
 *		IU_data_ptr fields are examined
 * @hostdata:	ibmvscsi_host_data of host
 *
 * Initialization messages start init_adapter().  Transport events block
 * the host, zero request_limit and then either schedule a CRQ re-enable
 * (format 0x06) or reset the host.  Command responses are matched to the
 * srp_event_struct named by the correlation token; its done() callback
 * is run and the event is then unlinked and returned to the pool.
*/
static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
				struct ibmvscsi_host_data *hostdata)
{
	long rc;
	unsigned long flags;
	/* The hypervisor copies our tag value here so no byteswapping */
	struct srp_event_struct *evt_struct =
			(__force struct srp_event_struct *)crq->IU_data_ptr;
	switch (crq->valid) {
	case VIOSRP_CRQ_INIT_RSP:		/* initialization */
		switch (crq->format) {
		case VIOSRP_CRQ_INIT:	/* Initialization message */
			dev_info(hostdata->dev, "partner initialized\n");
			/* Send back a response */
			rc = ibmvscsi_send_crq(hostdata, 0xC002000000000000LL, 0);
			if (rc == 0) {
				/* Now login */
				init_adapter(hostdata);
			} else {
				dev_err(hostdata->dev, "Unable to send init rsp. rc=%ld\n", rc);
			}

			break;
		case VIOSRP_CRQ_INIT_COMPLETE:	/* Initialization response */
			dev_info(hostdata->dev, "partner initialization complete\n");

			/* Now login */
			init_adapter(hostdata);
			break;
		default:
			dev_err(hostdata->dev, "unknown crq message type: %d\n", crq->format);
		}
		return;
	case VIOSRP_CRQ_XPORT_EVENT:	/* Hypervisor telling us the connection is closed */
		/* Stop new requests and mark the connection as unusable */
		scsi_block_requests(hostdata->host);
		atomic_set(&hostdata->request_limit, 0);
		if (crq->format == 0x06) {
			/* We need to re-setup the interpartition connection */
			dev_info(hostdata->dev, "Re-enabling adapter!\n");
			hostdata->client_migrated = 1;
			hostdata->reenable_crq = 1;
			purge_requests(hostdata, DID_REQUEUE);
			/* the re-enable itself is done by the work thread */
			wake_up(&hostdata->work_wait_q);
		} else {
			dev_err(hostdata->dev, "Virtual adapter failed rc %d!\n",
				crq->format);
			ibmvscsi_reset_host(hostdata);
		}
		return;
	case VIOSRP_CRQ_CMD_RSP:		/* real payload */
		break;
	default:
		dev_err(hostdata->dev, "got an invalid message type 0x%02x\n",
			crq->valid);
		return;
	}

	/* The only kind of payload CRQs we should get are responses to
	 * things we send. Make sure this response is to something we
	 * actually sent
	 */
	if (!valid_event_struct(&hostdata->pool, evt_struct)) {
		dev_err(hostdata->dev, "returned correlation_token 0x%p is invalid!\n",
		       evt_struct);
		return;
	}

	/* An event already marked free has been answered before */
	if (atomic_read(&evt_struct->free)) {
		dev_err(hostdata->dev, "received duplicate correlation_token 0x%p!\n",
			evt_struct);
		return;
	}

	/* SRP responses carry a request-limit delta; credit it to the host */
	if (crq->format == VIOSRP_SRP_FORMAT)
		atomic_add(be32_to_cpu(evt_struct->xfer_iu->srp.rsp.req_lim_delta),
			   &hostdata->request_limit);

	del_timer(&evt_struct->timer);

	/* A bad transport status fails the SCSI command, if there is one */
	if ((crq->status != VIOSRP_OK && crq->status != VIOSRP_OK2) && evt_struct->cmnd)
		evt_struct->cmnd->result = DID_ERROR << 16;
	if (evt_struct->done)
		evt_struct->done(evt_struct);
	else
		dev_err(hostdata->dev, "returned done() is NULL; not running it!\n");

	/*
	 * Lock the host_lock before messing with these structures, since we
	 * are running in a task context
	 *
	 * NOTE(review): evt_struct is still dereferenced to find the lock
	 * after free_event_struct(); presumably fine because pool entries
	 * are only marked free, not deallocated - confirm.
	 */
	spin_lock_irqsave(evt_struct->hostdata->host->host_lock, flags);
	list_del(&evt_struct->list);
	free_event_struct(&evt_struct->hostdata->pool, evt_struct);
	spin_unlock_irqrestore(evt_struct->hostdata->host->host_lock, flags);
}
1856
1857/**
1858 * ibmvscsi_slave_configure: Set the "allow_restart" flag for each disk.
1859 * @sdev:	struct scsi_device device to configure
1860 *
1861 * Enable allow_restart for a device if it is a disk.  Adjust the
1862 * queue_depth here also as is required by the documentation for
1863 * struct scsi_host_template.
1864 */
1865static int ibmvscsi_slave_configure(struct scsi_device *sdev)
1866{
1867	struct Scsi_Host *shost = sdev->host;
1868	unsigned long lock_flags = 0;
1869
1870	spin_lock_irqsave(shost->host_lock, lock_flags);
1871	if (sdev->type == TYPE_DISK) {
1872		sdev->allow_restart = 1;
1873		blk_queue_rq_timeout(sdev->request_queue, 120 * HZ);
1874	}
1875	spin_unlock_irqrestore(shost->host_lock, lock_flags);
1876	return 0;
1877}
1878
1879/**
1880 * ibmvscsi_change_queue_depth - Change the device's queue depth
1881 * @sdev:	scsi device struct
1882 * @qdepth:	depth to set
1883 * @reason:	calling context
1884 *
1885 * Return value:
1886 * 	actual depth set
1887 **/
1888static int ibmvscsi_change_queue_depth(struct scsi_device *sdev, int qdepth)
1889{
1890	if (qdepth > IBMVSCSI_MAX_CMDS_PER_LUN)
1891		qdepth = IBMVSCSI_MAX_CMDS_PER_LUN;
1892	return scsi_change_queue_depth(sdev, qdepth);
1893}
1894
1895/* ------------------------------------------------------------
1896 * sysfs attributes
1897 */
1898static ssize_t show_host_vhost_loc(struct device *dev,
1899				   struct device_attribute *attr, char *buf)
1900{
1901	struct Scsi_Host *shost = class_to_shost(dev);
1902	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1903	int len;
1904
1905	len = snprintf(buf, sizeof(hostdata->caps.loc), "%s\n",
1906		       hostdata->caps.loc);
1907	return len;
1908}
1909
1910static struct device_attribute ibmvscsi_host_vhost_loc = {
1911	.attr = {
1912		 .name = "vhost_loc",
1913		 .mode = S_IRUGO,
1914		 },
1915	.show = show_host_vhost_loc,
1916};
1917
1918static ssize_t show_host_vhost_name(struct device *dev,
1919				    struct device_attribute *attr, char *buf)
1920{
1921	struct Scsi_Host *shost = class_to_shost(dev);
1922	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1923	int len;
1924
1925	len = snprintf(buf, sizeof(hostdata->caps.name), "%s\n",
1926		       hostdata->caps.name);
1927	return len;
1928}
1929
1930static struct device_attribute ibmvscsi_host_vhost_name = {
1931	.attr = {
1932		 .name = "vhost_name",
1933		 .mode = S_IRUGO,
1934		 },
1935	.show = show_host_vhost_name,
1936};
1937
1938static ssize_t show_host_srp_version(struct device *dev,
1939				     struct device_attribute *attr, char *buf)
1940{
1941	struct Scsi_Host *shost = class_to_shost(dev);
1942	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1943	int len;
1944
1945	len = snprintf(buf, PAGE_SIZE, "%s\n",
1946		       hostdata->madapter_info.srp_version);
1947	return len;
1948}
1949
1950static struct device_attribute ibmvscsi_host_srp_version = {
1951	.attr = {
1952		 .name = "srp_version",
1953		 .mode = S_IRUGO,
1954		 },
1955	.show = show_host_srp_version,
1956};
1957
1958static ssize_t show_host_partition_name(struct device *dev,
1959					struct device_attribute *attr,
1960					char *buf)
1961{
1962	struct Scsi_Host *shost = class_to_shost(dev);
1963	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1964	int len;
1965
1966	len = snprintf(buf, PAGE_SIZE, "%s\n",
1967		       hostdata->madapter_info.partition_name);
1968	return len;
1969}
1970
1971static struct device_attribute ibmvscsi_host_partition_name = {
1972	.attr = {
1973		 .name = "partition_name",
1974		 .mode = S_IRUGO,
1975		 },
1976	.show = show_host_partition_name,
1977};
1978
1979static ssize_t show_host_partition_number(struct device *dev,
1980					  struct device_attribute *attr,
1981					  char *buf)
1982{
1983	struct Scsi_Host *shost = class_to_shost(dev);
1984	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1985	int len;
1986
1987	len = snprintf(buf, PAGE_SIZE, "%d\n",
1988		       be32_to_cpu(hostdata->madapter_info.partition_number));
1989	return len;
1990}
1991
1992static struct device_attribute ibmvscsi_host_partition_number = {
1993	.attr = {
1994		 .name = "partition_number",
1995		 .mode = S_IRUGO,
1996		 },
1997	.show = show_host_partition_number,
1998};
1999
2000static ssize_t show_host_mad_version(struct device *dev,
2001				     struct device_attribute *attr, char *buf)
2002{
2003	struct Scsi_Host *shost = class_to_shost(dev);
2004	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2005	int len;
2006
2007	len = snprintf(buf, PAGE_SIZE, "%d\n",
2008		       be32_to_cpu(hostdata->madapter_info.mad_version));
2009	return len;
2010}
2011
2012static struct device_attribute ibmvscsi_host_mad_version = {
2013	.attr = {
2014		 .name = "mad_version",
2015		 .mode = S_IRUGO,
2016		 },
2017	.show = show_host_mad_version,
2018};
2019
2020static ssize_t show_host_os_type(struct device *dev,
2021				 struct device_attribute *attr, char *buf)
2022{
2023	struct Scsi_Host *shost = class_to_shost(dev);
2024	struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2025	int len;
2026
2027	len = snprintf(buf, PAGE_SIZE, "%d\n",
2028		       be32_to_cpu(hostdata->madapter_info.os_type));
2029	return len;
2030}
2031
2032static struct device_attribute ibmvscsi_host_os_type = {
2033	.attr = {
2034		 .name = "os_type",
2035		 .mode = S_IRUGO,
2036		 },
2037	.show = show_host_os_type,
2038};
2039
/*
 * show_host_config - sysfs show handler for the "config" attribute
 *
 * Writes nothing to @buf and returns 0, so the attribute always reads
 * as empty.
 */
static ssize_t show_host_config(struct device *dev,
				struct device_attribute *attr, char *buf)
{
	return 0;
}
2045
2046static struct device_attribute ibmvscsi_host_config = {
2047	.attr = {
2048		.name = "config",
2049		.mode = S_IRUGO,
2050		},
2051	.show = show_host_config,
2052};
2053
/*
 * NULL-terminated list of the host attributes defined above; hooked into
 * the host template through its shost_attrs member.
 */
static struct device_attribute *ibmvscsi_attrs[] = {
	&ibmvscsi_host_vhost_loc,
	&ibmvscsi_host_vhost_name,
	&ibmvscsi_host_srp_version,
	&ibmvscsi_host_partition_name,
	&ibmvscsi_host_partition_number,
	&ibmvscsi_host_mad_version,
	&ibmvscsi_host_os_type,
	&ibmvscsi_host_config,
	NULL
};
2065
2066/* ------------------------------------------------------------
2067 * SCSI driver registration
2068 */
/*
 * SCSI host template for this driver: wires up the queuecommand and
 * error-handling entry points, the per-device configuration hooks and
 * the sysfs host attributes.  can_queue is overwritten with max_requests
 * in ibmvscsi_module_init().
 */
static struct scsi_host_template driver_template = {
	.module = THIS_MODULE,
	.name = "IBM POWER Virtual SCSI Adapter " IBMVSCSI_VERSION,
	.proc_name = "ibmvscsi",
	.queuecommand = ibmvscsi_queuecommand,
	.eh_timed_out = srp_timed_out,
	.eh_abort_handler = ibmvscsi_eh_abort_handler,
	.eh_device_reset_handler = ibmvscsi_eh_device_reset_handler,
	.eh_host_reset_handler = ibmvscsi_eh_host_reset_handler,
	.slave_configure = ibmvscsi_slave_configure,
	.change_queue_depth = ibmvscsi_change_queue_depth,
	.cmd_per_lun = IBMVSCSI_CMDS_PER_LUN_DEFAULT,
	.can_queue = IBMVSCSI_MAX_REQUESTS_DEFAULT,
	.this_id = -1,
	.sg_tablesize = SG_ALL,
	.use_clustering = ENABLE_CLUSTERING,
	.shost_attrs = ibmvscsi_attrs,
};
2087
2088/**
2089 * ibmvscsi_get_desired_dma - Calculate IO memory desired by the driver
2090 *
2091 * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
2092 *
2093 * Return value:
2094 *	Number of bytes of IO data the driver will need to perform well.
2095 */
2096static unsigned long ibmvscsi_get_desired_dma(struct vio_dev *vdev)
2097{
2098	/* iu_storage data allocated in initialize_event_pool */
2099	unsigned long desired_io = max_events * sizeof(union viosrp_iu);
2100
2101	/* add io space for sg data */
2102	desired_io += (IBMVSCSI_MAX_SECTORS_DEFAULT * 512 *
2103	                     IBMVSCSI_CMDS_PER_LUN_DEFAULT);
2104
2105	return desired_io;
2106}
2107
/*
 * ibmvscsi_do_work - Service a pending CRQ reset or re-enable request
 * @hostdata:	ibmvscsi_host_data of host
 *
 * Called from the work thread.  Handles reset_crq first, otherwise
 * reenable_crq; if neither flag is set it returns without doing
 * anything.  After a successful reset/re-enable the 0xC001... CRQ
 * message is sent to the partner.  On any failure request_limit is set
 * to -1 and an error is logged.  Requests are unblocked in both the
 * success and the failure case.
 */
static void ibmvscsi_do_work(struct ibmvscsi_host_data *hostdata)
{
	int rc;
	char *action = "reset";

	if (hostdata->reset_crq) {
		smp_rmb();
		/* flag is cleared before the queue is reset */
		hostdata->reset_crq = 0;

		rc = ibmvscsi_reset_crq_queue(&hostdata->queue, hostdata);
		if (!rc)
			rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
		/* interrupts are re-enabled whether or not the reset worked */
		vio_enable_interrupts(to_vio_dev(hostdata->dev));
	} else if (hostdata->reenable_crq) {
		smp_rmb();
		action = "enable";
		rc = ibmvscsi_reenable_crq_queue(&hostdata->queue, hostdata);
		/* here the flag is cleared only after the re-enable attempt */
		hostdata->reenable_crq = 0;
		if (!rc)
			rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
	} else
		return;

	if (rc) {
		atomic_set(&hostdata->request_limit, -1);
		dev_err(hostdata->dev, "error after %s\n", action);
	}

	scsi_unblock_requests(hostdata->host);
}
2138
2139static int ibmvscsi_work_to_do(struct ibmvscsi_host_data *hostdata)
2140{
2141	if (kthread_should_stop())
2142		return 1;
2143	else if (hostdata->reset_crq) {
2144		smp_rmb();
2145		return 1;
2146	} else if (hostdata->reenable_crq) {
2147		smp_rmb();
2148		return 1;
2149	}
2150
2151	return 0;
2152}
2153
2154static int ibmvscsi_work(void *data)
2155{
2156	struct ibmvscsi_host_data *hostdata = data;
2157	int rc;
2158
2159	set_user_nice(current, MIN_NICE);
2160
2161	while (1) {
2162		rc = wait_event_interruptible(hostdata->work_wait_q,
2163					      ibmvscsi_work_to_do(hostdata));
2164
2165		BUG_ON(rc);
2166
2167		if (kthread_should_stop())
2168			break;
2169
2170		ibmvscsi_do_work(hostdata);
2171	}
2172
2173	return 0;
2174}
2175
/**
 * ibmvscsi_probe - Called by bus code for each adapter
 * @vdev:	vio device being probed
 * @id:		matching entry of the device table (unused here)
 *
 * Allocates the SCSI host, maps the persistent buffers, starts the work
 * thread, sets up the CRQ and the event pool, registers the host and an
 * SRP remote port, and finally tries to start the initialization
 * handshake with the partner.
 *
 * Returns zero on success and -1 on any failure, after undoing the
 * steps that had already succeeded.
 */
static int ibmvscsi_probe(struct vio_dev *vdev, const struct vio_device_id *id)
{
	struct ibmvscsi_host_data *hostdata;
	struct Scsi_Host *host;
	struct device *dev = &vdev->dev;
	struct srp_rport_identifiers ids;
	struct srp_rport *rport;
	unsigned long wait_switch = 0;
	int rc;

	dev_set_drvdata(&vdev->dev, NULL);

	host = scsi_host_alloc(&driver_template, sizeof(*hostdata));
	if (!host) {
		dev_err(&vdev->dev, "couldn't allocate host data\n");
		goto scsi_host_alloc_failed;
	}

	host->transportt = ibmvscsi_transport_template;
	hostdata = shost_priv(host);
	memset(hostdata, 0x00, sizeof(*hostdata));
	INIT_LIST_HEAD(&hostdata->sent);
	init_waitqueue_head(&hostdata->work_wait_q);
	hostdata->host = host;
	hostdata->dev = dev;
	/* request_limit stays at -1 until initialization has completed */
	atomic_set(&hostdata->request_limit, -1);
	hostdata->host->max_sectors = IBMVSCSI_MAX_SECTORS_DEFAULT;

	if (map_persist_bufs(hostdata)) {
		dev_err(&vdev->dev, "couldn't map persistent buffers\n");
		goto persist_bufs_failed;
	}

	hostdata->work_thread = kthread_run(ibmvscsi_work, hostdata, "%s_%d",
					    "ibmvscsi", host->host_no);

	if (IS_ERR(hostdata->work_thread)) {
		dev_err(&vdev->dev, "couldn't initialize kthread. rc=%ld\n",
			PTR_ERR(hostdata->work_thread));
		goto init_crq_failed;
	}

	/* H_RESOURCE is not treated as fatal here; see the check below */
	rc = ibmvscsi_init_crq_queue(&hostdata->queue, hostdata, max_events);
	if (rc != 0 && rc != H_RESOURCE) {
		dev_err(&vdev->dev, "couldn't initialize crq. rc=%d\n", rc);
		goto kill_kthread;
	}
	if (initialize_event_pool(&hostdata->pool, max_events, hostdata) != 0) {
		dev_err(&vdev->dev, "couldn't initialize event pool\n");
		goto init_pool_failed;
	}

	host->max_lun = IBMVSCSI_MAX_LUN;
	host->max_id = max_id;
	host->max_channel = max_channel;
	host->max_cmd_len = 16;

	dev_info(dev,
		 "Maximum ID: %d Maximum LUN: %llu Maximum Channel: %d\n",
		 host->max_id, host->max_lun, host->max_channel);

	if (scsi_add_host(hostdata->host, hostdata->dev))
		goto add_host_failed;

	/* we don't have a proper target_port_id so let's use the fake one */
	memcpy(ids.port_id, hostdata->madapter_info.partition_name,
	       sizeof(ids.port_id));
	ids.roles = SRP_RPORT_ROLE_TARGET;
	rport = srp_rport_add(host, &ids);
	if (IS_ERR(rport))
		goto add_srp_port_failed;

	/* Try to send an initialization message.  Note that this is allowed
	 * to fail if the other end is not active.  In that case we don't
	 * want to scan
	 */
	if (ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0) == 0
	    || rc == H_RESOURCE) {
		/*
		 * Wait around max init_timeout secs for the adapter to finish
		 * initializing. When we are done initializing, we will have a
		 * valid request_limit.  We don't want Linux scanning before
		 * we are ready.
		 */
		for (wait_switch = jiffies + (init_timeout * HZ);
		     time_before(jiffies, wait_switch) &&
		     atomic_read(&hostdata->request_limit) < 2;) {

			msleep(10);
		}

		/* if we now have a valid request_limit, initiate a scan */
		if (atomic_read(&hostdata->request_limit) > 0)
			scsi_scan_host(host);
	}

	dev_set_drvdata(&vdev->dev, hostdata);
	list_add_tail(&hostdata->host_list, &ibmvscsi_head);
	return 0;

	/* Error unwind: each label undoes the step set up just before it */
      add_srp_port_failed:
	scsi_remove_host(hostdata->host);
      add_host_failed:
	release_event_pool(&hostdata->pool, hostdata);
      init_pool_failed:
	ibmvscsi_release_crq_queue(&hostdata->queue, hostdata, max_events);
      kill_kthread:
      kthread_stop(hostdata->work_thread);
      init_crq_failed:
	unmap_persist_bufs(hostdata);
      persist_bufs_failed:
	scsi_host_put(host);
      scsi_host_alloc_failed:
	/* NOTE(review): every failure path returns -1 rather than a specific errno */
	return -1;
}
2294
/*
 * ibmvscsi_remove - Tear down one adapter instance
 * @vdev:	vio device being removed
 *
 * Takes the host off the driver's host list, releases the persistent
 * buffers, the event pool and the CRQ, stops the work thread and then
 * removes and drops the SCSI host.
 *
 * NOTE(review): the buffers, event pool and CRQ are released before the
 * SCSI host is removed; confirm no request can still be in flight at
 * that point.
 *
 * Always returns zero.
 */
static int ibmvscsi_remove(struct vio_dev *vdev)
{
	struct ibmvscsi_host_data *hostdata = dev_get_drvdata(&vdev->dev);
	list_del(&hostdata->host_list);
	unmap_persist_bufs(hostdata);
	release_event_pool(&hostdata->pool, hostdata);
	ibmvscsi_release_crq_queue(&hostdata->queue, hostdata,
					max_events);

	kthread_stop(hostdata->work_thread);
	srp_remove_host(hostdata->host);
	scsi_remove_host(hostdata->host);
	scsi_host_put(hostdata->host);

	return 0;
}
2311
2312/**
2313 * ibmvscsi_resume: Resume from suspend
2314 * @dev:	device struct
2315 *
2316 * We may have lost an interrupt across suspend/resume, so kick the
2317 * interrupt handler
2318 */
2319static int ibmvscsi_resume(struct device *dev)
2320{
2321	struct ibmvscsi_host_data *hostdata = dev_get_drvdata(dev);
2322	vio_disable_interrupts(to_vio_dev(hostdata->dev));
2323	tasklet_schedule(&hostdata->srp_task);
2324
2325	return 0;
2326}
2327
/**
 * ibmvscsi_device_table: Used by vio.c to match devices in the device tree we
 * support.
 *
 * The table is terminated by an entry with two empty strings and is
 * exported through MODULE_DEVICE_TABLE().
 */
static const struct vio_device_id ibmvscsi_device_table[] = {
	{"vscsi", "IBM,v-scsi"},
	{ "", "" }
};
MODULE_DEVICE_TABLE(vio, ibmvscsi_device_table);
2337
/* Power-management callbacks: only a resume handler is provided */
static const struct dev_pm_ops ibmvscsi_pm_ops = {
	.resume = ibmvscsi_resume
};
2341
/*
 * vio driver description: ties the device table, the probe/remove entry
 * points, the desired-DMA estimate and the PM callbacks together.
 */
static struct vio_driver ibmvscsi_driver = {
	.id_table = ibmvscsi_device_table,
	.probe = ibmvscsi_probe,
	.remove = ibmvscsi_remove,
	.get_desired_dma = ibmvscsi_get_desired_dma,
	.name = "ibmvscsi",
	.pm = &ibmvscsi_pm_ops,
};
2350
/*
 * SRP transport function table handed to srp_attach_transport(); no
 * callbacks are filled in.
 */
static struct srp_function_template ibmvscsi_transport_functions = {
};
2353
2354int __init ibmvscsi_module_init(void)
2355{
2356	int ret;
2357
2358	/* Ensure we have two requests to do error recovery */
2359	driver_template.can_queue = max_requests;
2360	max_events = max_requests + 2;
2361
2362	if (!firmware_has_feature(FW_FEATURE_VIO))
2363		return -ENODEV;
2364
2365	ibmvscsi_transport_template =
2366		srp_attach_transport(&ibmvscsi_transport_functions);
2367	if (!ibmvscsi_transport_template)
2368		return -ENOMEM;
2369
2370	ret = vio_register_driver(&ibmvscsi_driver);
2371	if (ret)
2372		srp_release_transport(ibmvscsi_transport_template);
2373	return ret;
2374}
2375
/*
 * ibmvscsi_module_exit - Module exit point
 *
 * Undoes ibmvscsi_module_init() in reverse order: unregisters the vio
 * driver, then releases the SRP transport template.
 */
void __exit ibmvscsi_module_exit(void)
{
	vio_unregister_driver(&ibmvscsi_driver);
	srp_release_transport(ibmvscsi_transport_template);
}
2381
/* Register the module's load and unload entry points */
module_init(ibmvscsi_module_init);
module_exit(ibmvscsi_module_exit);