8cec5230fe313fd53557af39b361a044c3eca5f6
[sfrench/cifs-2.6.git] / drivers / scsi / ibmvscsi / ibmvscsi.c
1 /* ------------------------------------------------------------
2  * ibmvscsi.c
3  * (C) Copyright IBM Corporation 1994, 2004
4  * Authors: Colin DeVilbiss (devilbis@us.ibm.com)
5  *          Santiago Leon (santil@us.ibm.com)
6  *          Dave Boutcher (sleddog@us.ibm.com)
7  *
8  * This program is free software; you can redistribute it and/or modify
9  * it under the terms of the GNU General Public License as published by
10  * the Free Software Foundation; either version 2 of the License, or
11  * (at your option) any later version.
12  *
13  * This program is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16  * GNU General Public License for more details.
17  *
18  * You should have received a copy of the GNU General Public License
19  * along with this program; if not, write to the Free Software
20  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307
21  * USA
22  *
23  * ------------------------------------------------------------
24  * Emulation of a SCSI host adapter for Virtual I/O devices
25  *
26  * This driver supports the SCSI adapter implemented by the IBM
27  * Power5 firmware.  That SCSI adapter is not a physical adapter,
28  * but allows Linux SCSI peripheral drivers to directly
29  * access devices in another logical partition on the physical system.
30  *
31  * The virtual adapter(s) are present in the open firmware device
32  * tree just like real adapters.
33  *
34  * One of the capabilities provided on these systems is the ability
35  * to DMA between partitions.  The architecture states that for VSCSI,
36  * the server side is allowed to DMA to and from the client.  The client
37  * is never trusted to DMA to or from the server directly.
38  *
39  * Messages are sent between partitions on a "Command/Response Queue" 
40  * (CRQ), which is just a buffer of 16 byte entries in the receiver's memory.
41  * Senders cannot access the buffer directly, but send messages by
42  * making a hypervisor call and passing in the 16 bytes.  The hypervisor
43  * puts the message in the next 16 byte space in round-robin fashion,
44  * turns on the high order bit of the message (the valid bit), and 
45  * generates an interrupt to the receiver (if interrupts are turned on.) 
46  * The receiver just turns off the valid bit when they have copied out
47  * the message.
48  *
49  * The VSCSI client builds a SCSI Remote Protocol (SRP) Information Unit
50  * (IU) (as defined in the T10 standard available at www.t10.org), gets 
51  * a DMA address for the message, and sends it to the server as the
52  * payload of a CRQ message.  The server DMAs the SRP IU and processes it,
53  * including doing any additional data transfers.  When it is done, it
54  * DMAs the SRP response back to the same address as the request came from,
55  * and sends a CRQ message back to inform the client that the request has
56  * completed.
57  *
58  * TODO: This is currently pretty tied to the IBM pSeries hypervisor
59  * interfaces.  It would be really nice to abstract this above an RDMA
60  * layer.
61  */
62
63 #include <linux/module.h>
64 #include <linux/moduleparam.h>
65 #include <linux/dma-mapping.h>
66 #include <linux/delay.h>
67 #include <linux/slab.h>
68 #include <linux/of.h>
69 #include <linux/pm.h>
70 #include <linux/kthread.h>
71 #include <asm/firmware.h>
72 #include <asm/vio.h>
73 #include <scsi/scsi.h>
74 #include <scsi/scsi_cmnd.h>
75 #include <scsi/scsi_host.h>
76 #include <scsi/scsi_device.h>
77 #include <scsi/scsi_transport_srp.h>
78 #include "ibmvscsi.h"
79
/* The values below are somewhat arbitrary default values, but 
 * OS/400 will use 3 busses (disks, CDs, tapes, I think.)
 * Note that there are 3 bits of channel value, 6 bits of id, and
 * 5 bits of LUN.
 */
/* Largest ID value for each channel (exposed as a module parameter) */
static int max_id = 64;
/* Largest channel value (exposed as a module parameter) */
static int max_channel = 3;
/* Initialization timeout in seconds (exposed as a module parameter) */
static int init_timeout = 300;
/*
 * Timeouts for the individual request types.
 * NOTE(review): presumably in seconds like init_timeout - confirm against
 * the code that consumes them.
 */
static int login_timeout = 60;
static int info_timeout = 30;
static int abort_timeout = 60;
static int reset_timeout = 60;
/* Maximum requests for this adapter (read-only module parameter) */
static int max_requests = IBMVSCSI_MAX_REQUESTS_DEFAULT;
/*
 * Two more than the default request limit.
 * NOTE(review): presumably headroom for driver-internal events - confirm.
 */
static int max_events = IBMVSCSI_MAX_REQUESTS_DEFAULT + 2;
/* Enable fast fail (exposed as a module parameter) */
static int fast_fail = 1;
/* Attempt client managed reserve/release (read-only module parameter) */
static int client_reserve = 1;
/*
 * Partition identity reported to the server in the adapter info.
 * gather_partition_info() overwrites these from the device tree when the
 * properties exist; otherwise the defaults below are kept.  Note that the
 * -1 stored in the unsigned partition_number wraps to the maximum value.
 */
static char partition_name[96] = "UNKNOWN";
static unsigned int partition_number = -1;
/*
 * NOTE(review): presumably the list of adapters handled by this driver and
 * the lock protecting it - the users are outside this part of the file.
 */
static LIST_HEAD(ibmvscsi_head);
static DEFINE_SPINLOCK(ibmvscsi_driver_lock);

/* SRP transport template; it is not assigned in this part of the file. */
static struct scsi_transport_template *ibmvscsi_transport_template;
102
/* Driver version string, also published through MODULE_VERSION() below */
#define IBMVSCSI_VERSION "1.5.9"

MODULE_DESCRIPTION("IBM Virtual SCSI");
MODULE_AUTHOR("Dave Boutcher");
MODULE_LICENSE("GPL");
MODULE_VERSION(IBMVSCSI_VERSION);

/*
 * Module parameters.  max_requests and client_reserve are registered
 * read-only (S_IRUGO); the others are additionally writable by the
 * owner (S_IWUSR).
 */
module_param_named(max_id, max_id, int, S_IRUGO | S_IWUSR);
MODULE_PARM_DESC(max_id, "Largest ID value for each channel [Default=64]");
module_param_named(max_channel, max_channel, int, S_IRUGO | S_IWUSR);
MODULE_PARM_DESC(max_channel, "Largest channel value [Default=3]");
module_param_named(init_timeout, init_timeout, int, S_IRUGO | S_IWUSR);
MODULE_PARM_DESC(init_timeout, "Initialization timeout in seconds");
module_param_named(max_requests, max_requests, int, S_IRUGO);
MODULE_PARM_DESC(max_requests, "Maximum requests for this adapter");
module_param_named(fast_fail, fast_fail, int, S_IRUGO | S_IWUSR);
MODULE_PARM_DESC(fast_fail, "Enable fast fail. [Default=1]");
module_param_named(client_reserve, client_reserve, int, S_IRUGO );
MODULE_PARM_DESC(client_reserve, "Attempt client managed reserve/release");

/*
 * Forward declaration: ibmvscsi_task() calls this for every CRQ entry it
 * pulls off the queue, but the definition comes later in the file.
 */
static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
                                struct ibmvscsi_host_data *hostdata);
125
126 /* ------------------------------------------------------------
127  * Routines for managing the command/response queue
128  */
129 /**
130  * ibmvscsi_handle_event: - Interrupt handler for crq events
131  * @irq:        number of irq to handle, not used
132  * @dev_instance: ibmvscsi_host_data of host that received interrupt
133  *
134  * Disables interrupts and schedules srp_task
135  * Always returns IRQ_HANDLED
136  */
137 static irqreturn_t ibmvscsi_handle_event(int irq, void *dev_instance)
138 {
139         struct ibmvscsi_host_data *hostdata =
140             (struct ibmvscsi_host_data *)dev_instance;
141         vio_disable_interrupts(to_vio_dev(hostdata->dev));
142         tasklet_schedule(&hostdata->srp_task);
143         return IRQ_HANDLED;
144 }
145
146 /**
147  * release_crq_queue: - Deallocates data and unregisters CRQ
148  * @queue:      crq_queue to initialize and register
149  * @host_data:  ibmvscsi_host_data of host
150  *
151  * Frees irq, deallocates a page for messages, unmaps dma, and unregisters
152  * the crq with the hypervisor.
153  */
154 static void ibmvscsi_release_crq_queue(struct crq_queue *queue,
155                                        struct ibmvscsi_host_data *hostdata,
156                                        int max_requests)
157 {
158         long rc = 0;
159         struct vio_dev *vdev = to_vio_dev(hostdata->dev);
160         free_irq(vdev->irq, (void *)hostdata);
161         tasklet_kill(&hostdata->srp_task);
162         do {
163                 if (rc)
164                         msleep(100);
165                 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
166         } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
167         dma_unmap_single(hostdata->dev,
168                          queue->msg_token,
169                          queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
170         free_page((unsigned long)queue->msgs);
171 }
172
173 /**
174  * crq_queue_next_crq: - Returns the next entry in message queue
175  * @queue:      crq_queue to use
176  *
177  * Returns pointer to next entry in queue, or NULL if there are no new
178  * entried in the CRQ.
179  */
180 static struct viosrp_crq *crq_queue_next_crq(struct crq_queue *queue)
181 {
182         struct viosrp_crq *crq;
183         unsigned long flags;
184
185         spin_lock_irqsave(&queue->lock, flags);
186         crq = &queue->msgs[queue->cur];
187         if (crq->valid != VIOSRP_CRQ_FREE) {
188                 if (++queue->cur == queue->size)
189                         queue->cur = 0;
190
191                 /* Ensure the read of the valid bit occurs before reading any
192                  * other bits of the CRQ entry
193                  */
194                 rmb();
195         } else
196                 crq = NULL;
197         spin_unlock_irqrestore(&queue->lock, flags);
198
199         return crq;
200 }
201
202 /**
203  * ibmvscsi_send_crq: - Send a CRQ
204  * @hostdata:   the adapter
205  * @word1:      the first 64 bits of the data
206  * @word2:      the second 64 bits of the data
207  */
208 static int ibmvscsi_send_crq(struct ibmvscsi_host_data *hostdata,
209                              u64 word1, u64 word2)
210 {
211         struct vio_dev *vdev = to_vio_dev(hostdata->dev);
212
213         /*
214          * Ensure the command buffer is flushed to memory before handing it
215          * over to the VIOS to prevent it from fetching any stale data.
216          */
217         mb();
218         return plpar_hcall_norets(H_SEND_CRQ, vdev->unit_address, word1, word2);
219 }
220
221 /**
222  * ibmvscsi_task: - Process srps asynchronously
223  * @data:       ibmvscsi_host_data of host
224  */
225 static void ibmvscsi_task(void *data)
226 {
227         struct ibmvscsi_host_data *hostdata = (struct ibmvscsi_host_data *)data;
228         struct vio_dev *vdev = to_vio_dev(hostdata->dev);
229         struct viosrp_crq *crq;
230         int done = 0;
231
232         while (!done) {
233                 /* Pull all the valid messages off the CRQ */
234                 while ((crq = crq_queue_next_crq(&hostdata->queue)) != NULL) {
235                         ibmvscsi_handle_crq(crq, hostdata);
236                         crq->valid = VIOSRP_CRQ_FREE;
237                         wmb();
238                 }
239
240                 vio_enable_interrupts(vdev);
241                 crq = crq_queue_next_crq(&hostdata->queue);
242                 if (crq != NULL) {
243                         vio_disable_interrupts(vdev);
244                         ibmvscsi_handle_crq(crq, hostdata);
245                         crq->valid = VIOSRP_CRQ_FREE;
246                         wmb();
247                 } else {
248                         done = 1;
249                 }
250         }
251 }
252
253 static void gather_partition_info(void)
254 {
255         const char *ppartition_name;
256         const __be32 *p_number_ptr;
257
258         /* Retrieve information about this partition */
259         if (!of_root)
260                 return;
261
262         of_node_get(of_root);
263
264         ppartition_name = of_get_property(of_root, "ibm,partition-name", NULL);
265         if (ppartition_name)
266                 strlcpy(partition_name, ppartition_name,
267                                 sizeof(partition_name));
268         p_number_ptr = of_get_property(of_root, "ibm,partition-no", NULL);
269         if (p_number_ptr)
270                 partition_number = of_read_number(p_number_ptr, 1);
271         of_node_put(of_root);
272 }
273
274 static void set_adapter_info(struct ibmvscsi_host_data *hostdata)
275 {
276         memset(&hostdata->madapter_info, 0x00,
277                         sizeof(hostdata->madapter_info));
278
279         dev_info(hostdata->dev, "SRP_VERSION: %s\n", SRP_VERSION);
280         strcpy(hostdata->madapter_info.srp_version, SRP_VERSION);
281
282         strncpy(hostdata->madapter_info.partition_name, partition_name,
283                         sizeof(hostdata->madapter_info.partition_name));
284
285         hostdata->madapter_info.partition_number =
286                                         cpu_to_be32(partition_number);
287
288         hostdata->madapter_info.mad_version = cpu_to_be32(SRP_MAD_VERSION_1);
289         hostdata->madapter_info.os_type = cpu_to_be32(SRP_MAD_OS_LINUX);
290 }
291
292 /**
293  * reset_crq_queue: - resets a crq after a failure
294  * @queue:      crq_queue to initialize and register
295  * @hostdata:   ibmvscsi_host_data of host
296  *
297  */
298 static int ibmvscsi_reset_crq_queue(struct crq_queue *queue,
299                                     struct ibmvscsi_host_data *hostdata)
300 {
301         int rc = 0;
302         struct vio_dev *vdev = to_vio_dev(hostdata->dev);
303
304         /* Close the CRQ */
305         do {
306                 if (rc)
307                         msleep(100);
308                 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
309         } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
310
311         /* Clean out the queue */
312         memset(queue->msgs, 0x00, PAGE_SIZE);
313         queue->cur = 0;
314
315         set_adapter_info(hostdata);
316
317         /* And re-open it again */
318         rc = plpar_hcall_norets(H_REG_CRQ,
319                                 vdev->unit_address,
320                                 queue->msg_token, PAGE_SIZE);
321         if (rc == H_CLOSED) {
322                 /* Adapter is good, but other end is not ready */
323                 dev_warn(hostdata->dev, "Partner adapter not ready\n");
324         } else if (rc != 0) {
325                 dev_warn(hostdata->dev, "couldn't register crq--rc 0x%x\n", rc);
326         }
327         return rc;
328 }
329
330 /**
331  * initialize_crq_queue: - Initializes and registers CRQ with hypervisor
332  * @queue:      crq_queue to initialize and register
333  * @hostdata:   ibmvscsi_host_data of host
334  *
335  * Allocates a page for messages, maps it for dma, and registers
336  * the crq with the hypervisor.
337  * Returns zero on success.
338  */
339 static int ibmvscsi_init_crq_queue(struct crq_queue *queue,
340                                    struct ibmvscsi_host_data *hostdata,
341                                    int max_requests)
342 {
343         int rc;
344         int retrc;
345         struct vio_dev *vdev = to_vio_dev(hostdata->dev);
346
347         queue->msgs = (struct viosrp_crq *)get_zeroed_page(GFP_KERNEL);
348
349         if (!queue->msgs)
350                 goto malloc_failed;
351         queue->size = PAGE_SIZE / sizeof(*queue->msgs);
352
353         queue->msg_token = dma_map_single(hostdata->dev, queue->msgs,
354                                           queue->size * sizeof(*queue->msgs),
355                                           DMA_BIDIRECTIONAL);
356
357         if (dma_mapping_error(hostdata->dev, queue->msg_token))
358                 goto map_failed;
359
360         gather_partition_info();
361         set_adapter_info(hostdata);
362
363         retrc = rc = plpar_hcall_norets(H_REG_CRQ,
364                                 vdev->unit_address,
365                                 queue->msg_token, PAGE_SIZE);
366         if (rc == H_RESOURCE)
367                 /* maybe kexecing and resource is busy. try a reset */
368                 rc = ibmvscsi_reset_crq_queue(queue,
369                                               hostdata);
370
371         if (rc == H_CLOSED) {
372                 /* Adapter is good, but other end is not ready */
373                 dev_warn(hostdata->dev, "Partner adapter not ready\n");
374                 retrc = 0;
375         } else if (rc != 0) {
376                 dev_warn(hostdata->dev, "Error %d opening adapter\n", rc);
377                 goto reg_crq_failed;
378         }
379
380         queue->cur = 0;
381         spin_lock_init(&queue->lock);
382
383         tasklet_init(&hostdata->srp_task, (void *)ibmvscsi_task,
384                      (unsigned long)hostdata);
385
386         if (request_irq(vdev->irq,
387                         ibmvscsi_handle_event,
388                         0, "ibmvscsi", (void *)hostdata) != 0) {
389                 dev_err(hostdata->dev, "couldn't register irq 0x%x\n",
390                         vdev->irq);
391                 goto req_irq_failed;
392         }
393
394         rc = vio_enable_interrupts(vdev);
395         if (rc != 0) {
396                 dev_err(hostdata->dev, "Error %d enabling interrupts!!!\n", rc);
397                 goto req_irq_failed;
398         }
399
400         return retrc;
401
402       req_irq_failed:
403         tasklet_kill(&hostdata->srp_task);
404         rc = 0;
405         do {
406                 if (rc)
407                         msleep(100);
408                 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
409         } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
410       reg_crq_failed:
411         dma_unmap_single(hostdata->dev,
412                          queue->msg_token,
413                          queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
414       map_failed:
415         free_page((unsigned long)queue->msgs);
416       malloc_failed:
417         return -1;
418 }
419
420 /**
421  * reenable_crq_queue: - reenables a crq after
422  * @queue:      crq_queue to initialize and register
423  * @hostdata:   ibmvscsi_host_data of host
424  *
425  */
426 static int ibmvscsi_reenable_crq_queue(struct crq_queue *queue,
427                                        struct ibmvscsi_host_data *hostdata)
428 {
429         int rc = 0;
430         struct vio_dev *vdev = to_vio_dev(hostdata->dev);
431
432         /* Re-enable the CRQ */
433         do {
434                 if (rc)
435                         msleep(100);
436                 rc = plpar_hcall_norets(H_ENABLE_CRQ, vdev->unit_address);
437         } while ((rc == H_IN_PROGRESS) || (rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
438
439         if (rc)
440                 dev_err(hostdata->dev, "Error %d enabling adapter\n", rc);
441         return rc;
442 }
443
444 /* ------------------------------------------------------------
445  * Routines for the event pool and event structs
446  */
447 /**
448  * initialize_event_pool: - Allocates and initializes the event pool for a host
449  * @pool:       event_pool to be initialized
450  * @size:       Number of events in pool
451  * @hostdata:   ibmvscsi_host_data who owns the event pool
452  *
453  * Returns zero on success.
454 */
455 static int initialize_event_pool(struct event_pool *pool,
456                                  int size, struct ibmvscsi_host_data *hostdata)
457 {
458         int i;
459
460         pool->size = size;
461         pool->next = 0;
462         pool->events = kcalloc(pool->size, sizeof(*pool->events), GFP_KERNEL);
463         if (!pool->events)
464                 return -ENOMEM;
465
466         pool->iu_storage =
467             dma_alloc_coherent(hostdata->dev,
468                                pool->size * sizeof(*pool->iu_storage),
469                                &pool->iu_token, 0);
470         if (!pool->iu_storage) {
471                 kfree(pool->events);
472                 return -ENOMEM;
473         }
474
475         for (i = 0; i < pool->size; ++i) {
476                 struct srp_event_struct *evt = &pool->events[i];
477                 memset(&evt->crq, 0x00, sizeof(evt->crq));
478                 atomic_set(&evt->free, 1);
479                 evt->crq.valid = VIOSRP_CRQ_CMD_RSP;
480                 evt->crq.IU_length = cpu_to_be16(sizeof(*evt->xfer_iu));
481                 evt->crq.IU_data_ptr = cpu_to_be64(pool->iu_token +
482                         sizeof(*evt->xfer_iu) * i);
483                 evt->xfer_iu = pool->iu_storage + i;
484                 evt->hostdata = hostdata;
485                 evt->ext_list = NULL;
486                 evt->ext_list_token = 0;
487         }
488
489         return 0;
490 }
491
492 /**
493  * release_event_pool: - Frees memory of an event pool of a host
494  * @pool:       event_pool to be released
495  * @hostdata:   ibmvscsi_host_data who owns the even pool
496  *
497  * Returns zero on success.
498 */
499 static void release_event_pool(struct event_pool *pool,
500                                struct ibmvscsi_host_data *hostdata)
501 {
502         int i, in_use = 0;
503         for (i = 0; i < pool->size; ++i) {
504                 if (atomic_read(&pool->events[i].free) != 1)
505                         ++in_use;
506                 if (pool->events[i].ext_list) {
507                         dma_free_coherent(hostdata->dev,
508                                   SG_ALL * sizeof(struct srp_direct_buf),
509                                   pool->events[i].ext_list,
510                                   pool->events[i].ext_list_token);
511                 }
512         }
513         if (in_use)
514                 dev_warn(hostdata->dev, "releasing event pool with %d "
515                          "events still in use?\n", in_use);
516         kfree(pool->events);
517         dma_free_coherent(hostdata->dev,
518                           pool->size * sizeof(*pool->iu_storage),
519                           pool->iu_storage, pool->iu_token);
520 }
521
522 /**
523  * valid_event_struct: - Determines if event is valid.
524  * @pool:       event_pool that contains the event
525  * @evt:        srp_event_struct to be checked for validity
526  *
527  * Returns zero if event is invalid, one otherwise.
528 */
529 static int valid_event_struct(struct event_pool *pool,
530                                 struct srp_event_struct *evt)
531 {
532         int index = evt - pool->events;
533         if (index < 0 || index >= pool->size)   /* outside of bounds */
534                 return 0;
535         if (evt != pool->events + index)        /* unaligned */
536                 return 0;
537         return 1;
538 }
539
540 /**
541  * ibmvscsi_free-event_struct: - Changes status of event to "free"
542  * @pool:       event_pool that contains the event
543  * @evt:        srp_event_struct to be modified
544  *
545 */
546 static void free_event_struct(struct event_pool *pool,
547                                        struct srp_event_struct *evt)
548 {
549         if (!valid_event_struct(pool, evt)) {
550                 dev_err(evt->hostdata->dev, "Freeing invalid event_struct %p "
551                         "(not in pool %p)\n", evt, pool->events);
552                 return;
553         }
554         if (atomic_inc_return(&evt->free) != 1) {
555                 dev_err(evt->hostdata->dev, "Freeing event_struct %p "
556                         "which is not in use!\n", evt);
557                 return;
558         }
559 }
560
561 /**
562  * get_evt_struct: - Gets the next free event in pool
563  * @pool:       event_pool that contains the events to be searched
564  *
565  * Returns the next event in "free" state, and NULL if none are free.
566  * Note that no synchronization is done here, we assume the host_lock
567  * will syncrhonze things.
568 */
569 static struct srp_event_struct *get_event_struct(struct event_pool *pool)
570 {
571         int i;
572         int poolsize = pool->size;
573         int offset = pool->next;
574
575         for (i = 0; i < poolsize; i++) {
576                 offset = (offset + 1) % poolsize;
577                 if (!atomic_dec_if_positive(&pool->events[offset].free)) {
578                         pool->next = offset;
579                         return &pool->events[offset];
580                 }
581         }
582
583         printk(KERN_ERR "ibmvscsi: found no event struct in pool!\n");
584         return NULL;
585 }
586
587 /**
588  * init_event_struct: Initialize fields in an event struct that are always 
589  *                    required.
590  * @evt:        The event
591  * @done:       Routine to call when the event is responded to
592  * @format:     SRP or MAD format
593  * @timeout:    timeout value set in the CRQ
594  */
595 static void init_event_struct(struct srp_event_struct *evt_struct,
596                               void (*done) (struct srp_event_struct *),
597                               u8 format,
598                               int timeout)
599 {
600         evt_struct->cmnd = NULL;
601         evt_struct->cmnd_done = NULL;
602         evt_struct->sync_srp = NULL;
603         evt_struct->crq.format = format;
604         evt_struct->crq.timeout = cpu_to_be16(timeout);
605         evt_struct->done = done;
606 }
607
608 /* ------------------------------------------------------------
609  * Routines for receiving SCSI responses from the hosting partition
610  */
611
612 /**
613  * set_srp_direction: Set the fields in the srp related to data
614  *     direction and number of buffers based on the direction in
615  *     the scsi_cmnd and the number of buffers
616  */
617 static void set_srp_direction(struct scsi_cmnd *cmd,
618                               struct srp_cmd *srp_cmd, 
619                               int numbuf)
620 {
621         u8 fmt;
622
623         if (numbuf == 0)
624                 return;
625         
626         if (numbuf == 1)
627                 fmt = SRP_DATA_DESC_DIRECT;
628         else {
629                 fmt = SRP_DATA_DESC_INDIRECT;
630                 numbuf = min(numbuf, MAX_INDIRECT_BUFS);
631
632                 if (cmd->sc_data_direction == DMA_TO_DEVICE)
633                         srp_cmd->data_out_desc_cnt = numbuf;
634                 else
635                         srp_cmd->data_in_desc_cnt = numbuf;
636         }
637
638         if (cmd->sc_data_direction == DMA_TO_DEVICE)
639                 srp_cmd->buf_fmt = fmt << 4;
640         else
641                 srp_cmd->buf_fmt = fmt;
642 }
643
644 /**
645  * unmap_cmd_data: - Unmap data pointed in srp_cmd based on the format
646  * @cmd:        srp_cmd whose additional_data member will be unmapped
647  * @dev:        device for which the memory is mapped
648  *
649 */
650 static void unmap_cmd_data(struct srp_cmd *cmd,
651                            struct srp_event_struct *evt_struct,
652                            struct device *dev)
653 {
654         u8 out_fmt, in_fmt;
655
656         out_fmt = cmd->buf_fmt >> 4;
657         in_fmt = cmd->buf_fmt & ((1U << 4) - 1);
658
659         if (out_fmt == SRP_NO_DATA_DESC && in_fmt == SRP_NO_DATA_DESC)
660                 return;
661
662         if (evt_struct->cmnd)
663                 scsi_dma_unmap(evt_struct->cmnd);
664 }
665
666 static int map_sg_list(struct scsi_cmnd *cmd, int nseg,
667                        struct srp_direct_buf *md)
668 {
669         int i;
670         struct scatterlist *sg;
671         u64 total_length = 0;
672
673         scsi_for_each_sg(cmd, sg, nseg, i) {
674                 struct srp_direct_buf *descr = md + i;
675                 descr->va = cpu_to_be64(sg_dma_address(sg));
676                 descr->len = cpu_to_be32(sg_dma_len(sg));
677                 descr->key = 0;
678                 total_length += sg_dma_len(sg);
679         }
680         return total_length;
681 }
682
683 /**
684  * map_sg_data: - Maps dma for a scatterlist and initializes decriptor fields
685  * @cmd:        struct scsi_cmnd with the scatterlist
686  * @srp_cmd:    srp_cmd that contains the memory descriptor
687  * @dev:        device for which to map dma memory
688  *
689  * Called by map_data_for_srp_cmd() when building srp cmd from scsi cmd.
690  * Returns 1 on success.
691 */
692 static int map_sg_data(struct scsi_cmnd *cmd,
693                        struct srp_event_struct *evt_struct,
694                        struct srp_cmd *srp_cmd, struct device *dev)
695 {
696
697         int sg_mapped;
698         u64 total_length = 0;
699         struct srp_direct_buf *data =
700                 (struct srp_direct_buf *) srp_cmd->add_data;
701         struct srp_indirect_buf *indirect =
702                 (struct srp_indirect_buf *) data;
703
704         sg_mapped = scsi_dma_map(cmd);
705         if (!sg_mapped)
706                 return 1;
707         else if (sg_mapped < 0)
708                 return 0;
709
710         set_srp_direction(cmd, srp_cmd, sg_mapped);
711
712         /* special case; we can use a single direct descriptor */
713         if (sg_mapped == 1) {
714                 map_sg_list(cmd, sg_mapped, data);
715                 return 1;
716         }
717
718         indirect->table_desc.va = 0;
719         indirect->table_desc.len = cpu_to_be32(sg_mapped *
720                                                sizeof(struct srp_direct_buf));
721         indirect->table_desc.key = 0;
722
723         if (sg_mapped <= MAX_INDIRECT_BUFS) {
724                 total_length = map_sg_list(cmd, sg_mapped,
725                                            &indirect->desc_list[0]);
726                 indirect->len = cpu_to_be32(total_length);
727                 return 1;
728         }
729
730         /* get indirect table */
731         if (!evt_struct->ext_list) {
732                 evt_struct->ext_list = (struct srp_direct_buf *)
733                         dma_alloc_coherent(dev,
734                                            SG_ALL * sizeof(struct srp_direct_buf),
735                                            &evt_struct->ext_list_token, 0);
736                 if (!evt_struct->ext_list) {
737                         if (!firmware_has_feature(FW_FEATURE_CMO))
738                                 sdev_printk(KERN_ERR, cmd->device,
739                                             "Can't allocate memory "
740                                             "for indirect table\n");
741                         scsi_dma_unmap(cmd);
742                         return 0;
743                 }
744         }
745
746         total_length = map_sg_list(cmd, sg_mapped, evt_struct->ext_list);
747
748         indirect->len = cpu_to_be32(total_length);
749         indirect->table_desc.va = cpu_to_be64(evt_struct->ext_list_token);
750         indirect->table_desc.len = cpu_to_be32(sg_mapped *
751                                                sizeof(indirect->desc_list[0]));
752         memcpy(indirect->desc_list, evt_struct->ext_list,
753                MAX_INDIRECT_BUFS * sizeof(struct srp_direct_buf));
754         return 1;
755 }
756
757 /**
758  * map_data_for_srp_cmd: - Calls functions to map data for srp cmds
759  * @cmd:        struct scsi_cmnd with the memory to be mapped
760  * @srp_cmd:    srp_cmd that contains the memory descriptor
761  * @dev:        dma device for which to map dma memory
762  *
763  * Called by scsi_cmd_to_srp_cmd() when converting scsi cmds to srp cmds 
764  * Returns 1 on success.
765 */
766 static int map_data_for_srp_cmd(struct scsi_cmnd *cmd,
767                                 struct srp_event_struct *evt_struct,
768                                 struct srp_cmd *srp_cmd, struct device *dev)
769 {
770         switch (cmd->sc_data_direction) {
771         case DMA_FROM_DEVICE:
772         case DMA_TO_DEVICE:
773                 break;
774         case DMA_NONE:
775                 return 1;
776         case DMA_BIDIRECTIONAL:
777                 sdev_printk(KERN_ERR, cmd->device,
778                             "Can't map DMA_BIDIRECTIONAL to read/write\n");
779                 return 0;
780         default:
781                 sdev_printk(KERN_ERR, cmd->device,
782                             "Unknown data direction 0x%02x; can't map!\n",
783                             cmd->sc_data_direction);
784                 return 0;
785         }
786
787         return map_sg_data(cmd, evt_struct, srp_cmd, dev);
788 }
789
790 /**
791  * purge_requests: Our virtual adapter just shut down.  purge any sent requests
792  * @hostdata:    the adapter
793  */
794 static void purge_requests(struct ibmvscsi_host_data *hostdata, int error_code)
795 {
796         struct srp_event_struct *evt;
797         unsigned long flags;
798
799         spin_lock_irqsave(hostdata->host->host_lock, flags);
800         while (!list_empty(&hostdata->sent)) {
801                 evt = list_first_entry(&hostdata->sent, struct srp_event_struct, list);
802                 list_del(&evt->list);
803                 del_timer(&evt->timer);
804
805                 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
806                 if (evt->cmnd) {
807                         evt->cmnd->result = (error_code << 16);
808                         unmap_cmd_data(&evt->iu.srp.cmd, evt,
809                                        evt->hostdata->dev);
810                         if (evt->cmnd_done)
811                                 evt->cmnd_done(evt->cmnd);
812                 } else if (evt->done && evt->crq.format != VIOSRP_MAD_FORMAT &&
813                            evt->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
814                         evt->done(evt);
815                 free_event_struct(&evt->hostdata->pool, evt);
816                 spin_lock_irqsave(hostdata->host->host_lock, flags);
817         }
818         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
819 }
820
821 /**
822  * ibmvscsi_reset_host - Reset the connection to the server
823  * @hostdata:   struct ibmvscsi_host_data to reset
824 */
825 static void ibmvscsi_reset_host(struct ibmvscsi_host_data *hostdata)
826 {
827         scsi_block_requests(hostdata->host);
828         atomic_set(&hostdata->request_limit, 0);
829
830         purge_requests(hostdata, DID_ERROR);
831         hostdata->reset_crq = 1;
832         wake_up(&hostdata->work_wait_q);
833 }
834
835 /**
836  * ibmvscsi_timeout - Internal command timeout handler
837  * @evt_struct: struct srp_event_struct that timed out
838  *
839  * Called when an internally generated command times out
840 */
841 static void ibmvscsi_timeout(struct timer_list *t)
842 {
843         struct srp_event_struct *evt_struct = from_timer(evt_struct, t, timer);
844         struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
845
846         dev_err(hostdata->dev, "Command timed out (%x). Resetting connection\n",
847                 evt_struct->iu.srp.cmd.opcode);
848
849         ibmvscsi_reset_host(hostdata);
850 }
851
852
853 /* ------------------------------------------------------------
854  * Routines for sending and receiving SRPs
855  */
856 /**
857  * ibmvscsi_send_srp_event: - Transforms event to u64 array and calls send_crq()
858  * @evt_struct: evt_struct to be sent
859  * @hostdata:   ibmvscsi_host_data of host
860  * @timeout:    timeout in seconds - 0 means do not time command
861  *
862  * Returns the value returned from ibmvscsi_send_crq(). (Zero for success)
863  * Note that this routine assumes that host_lock is held for synchronization
864 */
865 static int ibmvscsi_send_srp_event(struct srp_event_struct *evt_struct,
866                                    struct ibmvscsi_host_data *hostdata,
867                                    unsigned long timeout)
868 {
869         __be64 *crq_as_u64 = (__be64 *)&evt_struct->crq;
870         int request_status = 0;
871         int rc;
872         int srp_req = 0;
873
874         /* If we have exhausted our request limit, just fail this request,
875          * unless it is for a reset or abort.
876          * Note that there are rare cases involving driver generated requests 
877          * (such as task management requests) that the mid layer may think we
878          * can handle more requests (can_queue) when we actually can't
879          */
880         if (evt_struct->crq.format == VIOSRP_SRP_FORMAT) {
881                 srp_req = 1;
882                 request_status =
883                         atomic_dec_if_positive(&hostdata->request_limit);
884                 /* If request limit was -1 when we started, it is now even
885                  * less than that
886                  */
887                 if (request_status < -1)
888                         goto send_error;
889                 /* Otherwise, we may have run out of requests. */
890                 /* If request limit was 0 when we started the adapter is in the
891                  * process of performing a login with the server adapter, or
892                  * we may have run out of requests.
893                  */
894                 else if (request_status == -1 &&
895                          evt_struct->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
896                         goto send_busy;
897                 /* Abort and reset calls should make it through.
898                  * Nothing except abort and reset should use the last two
899                  * slots unless we had two or less to begin with.
900                  */
901                 else if (request_status < 2 &&
902                          evt_struct->iu.srp.cmd.opcode != SRP_TSK_MGMT) {
903                         /* In the case that we have less than two requests
904                          * available, check the server limit as a combination
905                          * of the request limit and the number of requests
906                          * in-flight (the size of the send list).  If the
907                          * server limit is greater than 2, return busy so
908                          * that the last two are reserved for reset and abort.
909                          */
910                         int server_limit = request_status;
911                         struct srp_event_struct *tmp_evt;
912
913                         list_for_each_entry(tmp_evt, &hostdata->sent, list) {
914                                 server_limit++;
915                         }
916
917                         if (server_limit > 2)
918                                 goto send_busy;
919                 }
920         }
921
922         /* Copy the IU into the transfer area */
923         *evt_struct->xfer_iu = evt_struct->iu;
924         evt_struct->xfer_iu->srp.rsp.tag = (u64)evt_struct;
925
926         /* Add this to the sent list.  We need to do this 
927          * before we actually send 
928          * in case it comes back REALLY fast
929          */
930         list_add_tail(&evt_struct->list, &hostdata->sent);
931
932         timer_setup(&evt_struct->timer, ibmvscsi_timeout, 0);
933         if (timeout) {
934                 evt_struct->timer.expires = jiffies + (timeout * HZ);
935                 add_timer(&evt_struct->timer);
936         }
937
938         rc = ibmvscsi_send_crq(hostdata, be64_to_cpu(crq_as_u64[0]),
939                                be64_to_cpu(crq_as_u64[1]));
940         if (rc != 0) {
941                 list_del(&evt_struct->list);
942                 del_timer(&evt_struct->timer);
943
944                 /* If send_crq returns H_CLOSED, return SCSI_MLQUEUE_HOST_BUSY.
945                  * Firmware will send a CRQ with a transport event (0xFF) to
946                  * tell this client what has happened to the transport.  This
947                  * will be handled in ibmvscsi_handle_crq()
948                  */
949                 if (rc == H_CLOSED) {
950                         dev_warn(hostdata->dev, "send warning. "
951                                  "Receive queue closed, will retry.\n");
952                         goto send_busy;
953                 }
954                 dev_err(hostdata->dev, "send error %d\n", rc);
955                 if (srp_req)
956                         atomic_inc(&hostdata->request_limit);
957                 goto send_error;
958         }
959
960         return 0;
961
962  send_busy:
963         unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
964
965         free_event_struct(&hostdata->pool, evt_struct);
966         if (srp_req && request_status != -1)
967                 atomic_inc(&hostdata->request_limit);
968         return SCSI_MLQUEUE_HOST_BUSY;
969
970  send_error:
971         unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
972
973         if (evt_struct->cmnd != NULL) {
974                 evt_struct->cmnd->result = DID_ERROR << 16;
975                 evt_struct->cmnd_done(evt_struct->cmnd);
976         } else if (evt_struct->done)
977                 evt_struct->done(evt_struct);
978
979         free_event_struct(&hostdata->pool, evt_struct);
980         return 0;
981 }
982
983 /**
984  * handle_cmd_rsp: -  Handle responses from commands
985  * @evt_struct: srp_event_struct to be handled
986  *
987  * Used as a callback by when sending scsi cmds.
988  * Gets called by ibmvscsi_handle_crq()
989 */
990 static void handle_cmd_rsp(struct srp_event_struct *evt_struct)
991 {
992         struct srp_rsp *rsp = &evt_struct->xfer_iu->srp.rsp;
993         struct scsi_cmnd *cmnd = evt_struct->cmnd;
994
995         if (unlikely(rsp->opcode != SRP_RSP)) {
996                 if (printk_ratelimit())
997                         dev_warn(evt_struct->hostdata->dev,
998                                  "bad SRP RSP type %#02x\n", rsp->opcode);
999         }
1000         
1001         if (cmnd) {
1002                 cmnd->result |= rsp->status;
1003                 if (((cmnd->result >> 1) & 0x1f) == CHECK_CONDITION)
1004                         memcpy(cmnd->sense_buffer,
1005                                rsp->data,
1006                                be32_to_cpu(rsp->sense_data_len));
1007                 unmap_cmd_data(&evt_struct->iu.srp.cmd, 
1008                                evt_struct, 
1009                                evt_struct->hostdata->dev);
1010
1011                 if (rsp->flags & SRP_RSP_FLAG_DOOVER)
1012                         scsi_set_resid(cmnd,
1013                                        be32_to_cpu(rsp->data_out_res_cnt));
1014                 else if (rsp->flags & SRP_RSP_FLAG_DIOVER)
1015                         scsi_set_resid(cmnd, be32_to_cpu(rsp->data_in_res_cnt));
1016         }
1017
1018         if (evt_struct->cmnd_done)
1019                 evt_struct->cmnd_done(cmnd);
1020 }
1021
1022 /**
1023  * lun_from_dev: - Returns the lun of the scsi device
1024  * @dev:        struct scsi_device
1025  *
1026 */
1027 static inline u16 lun_from_dev(struct scsi_device *dev)
1028 {
1029         return (0x2 << 14) | (dev->id << 8) | (dev->channel << 5) | dev->lun;
1030 }
1031
1032 /**
1033  * ibmvscsi_queue: - The queuecommand function of the scsi template 
1034  * @cmd:        struct scsi_cmnd to be executed
1035  * @done:       Callback function to be called when cmd is completed
1036 */
1037 static int ibmvscsi_queuecommand_lck(struct scsi_cmnd *cmnd,
1038                                  void (*done) (struct scsi_cmnd *))
1039 {
1040         struct srp_cmd *srp_cmd;
1041         struct srp_event_struct *evt_struct;
1042         struct srp_indirect_buf *indirect;
1043         struct ibmvscsi_host_data *hostdata = shost_priv(cmnd->device->host);
1044         u16 lun = lun_from_dev(cmnd->device);
1045         u8 out_fmt, in_fmt;
1046
1047         cmnd->result = (DID_OK << 16);
1048         evt_struct = get_event_struct(&hostdata->pool);
1049         if (!evt_struct)
1050                 return SCSI_MLQUEUE_HOST_BUSY;
1051
1052         /* Set up the actual SRP IU */
1053         srp_cmd = &evt_struct->iu.srp.cmd;
1054         memset(srp_cmd, 0x00, SRP_MAX_IU_LEN);
1055         srp_cmd->opcode = SRP_CMD;
1056         memcpy(srp_cmd->cdb, cmnd->cmnd, sizeof(srp_cmd->cdb));
1057         int_to_scsilun(lun, &srp_cmd->lun);
1058
1059         if (!map_data_for_srp_cmd(cmnd, evt_struct, srp_cmd, hostdata->dev)) {
1060                 if (!firmware_has_feature(FW_FEATURE_CMO))
1061                         sdev_printk(KERN_ERR, cmnd->device,
1062                                     "couldn't convert cmd to srp_cmd\n");
1063                 free_event_struct(&hostdata->pool, evt_struct);
1064                 return SCSI_MLQUEUE_HOST_BUSY;
1065         }
1066
1067         init_event_struct(evt_struct,
1068                           handle_cmd_rsp,
1069                           VIOSRP_SRP_FORMAT,
1070                           cmnd->request->timeout/HZ);
1071
1072         evt_struct->cmnd = cmnd;
1073         evt_struct->cmnd_done = done;
1074
1075         /* Fix up dma address of the buffer itself */
1076         indirect = (struct srp_indirect_buf *) srp_cmd->add_data;
1077         out_fmt = srp_cmd->buf_fmt >> 4;
1078         in_fmt = srp_cmd->buf_fmt & ((1U << 4) - 1);
1079         if ((in_fmt == SRP_DATA_DESC_INDIRECT ||
1080              out_fmt == SRP_DATA_DESC_INDIRECT) &&
1081             indirect->table_desc.va == 0) {
1082                 indirect->table_desc.va =
1083                         cpu_to_be64(be64_to_cpu(evt_struct->crq.IU_data_ptr) +
1084                         offsetof(struct srp_cmd, add_data) +
1085                         offsetof(struct srp_indirect_buf, desc_list));
1086         }
1087
1088         return ibmvscsi_send_srp_event(evt_struct, hostdata, 0);
1089 }
1090
1091 static DEF_SCSI_QCMD(ibmvscsi_queuecommand)
1092
1093 /* ------------------------------------------------------------
1094  * Routines for driver initialization
1095  */
1096
1097 /**
1098  * map_persist_bufs: - Pre-map persistent data for adapter logins
1099  * @hostdata:   ibmvscsi_host_data of host
1100  *
1101  * Map the capabilities and adapter info DMA buffers to avoid runtime failures.
1102  * Return 1 on error, 0 on success.
1103  */
1104 static int map_persist_bufs(struct ibmvscsi_host_data *hostdata)
1105 {
1106
1107         hostdata->caps_addr = dma_map_single(hostdata->dev, &hostdata->caps,
1108                                              sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1109
1110         if (dma_mapping_error(hostdata->dev, hostdata->caps_addr)) {
1111                 dev_err(hostdata->dev, "Unable to map capabilities buffer!\n");
1112                 return 1;
1113         }
1114
1115         hostdata->adapter_info_addr = dma_map_single(hostdata->dev,
1116                                                      &hostdata->madapter_info,
1117                                                      sizeof(hostdata->madapter_info),
1118                                                      DMA_BIDIRECTIONAL);
1119         if (dma_mapping_error(hostdata->dev, hostdata->adapter_info_addr)) {
1120                 dev_err(hostdata->dev, "Unable to map adapter info buffer!\n");
1121                 dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1122                                  sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1123                 return 1;
1124         }
1125
1126         return 0;
1127 }
1128
1129 /**
1130  * unmap_persist_bufs: - Unmap persistent data needed for adapter logins
1131  * @hostdata:   ibmvscsi_host_data of host
1132  *
1133  * Unmap the capabilities and adapter info DMA buffers
1134  */
1135 static void unmap_persist_bufs(struct ibmvscsi_host_data *hostdata)
1136 {
1137         dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1138                          sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1139
1140         dma_unmap_single(hostdata->dev, hostdata->adapter_info_addr,
1141                          sizeof(hostdata->madapter_info), DMA_BIDIRECTIONAL);
1142 }
1143
1144 /**
1145  * login_rsp: - Handle response to SRP login request
1146  * @evt_struct: srp_event_struct with the response
1147  *
1148  * Used as a "done" callback by when sending srp_login. Gets called
1149  * by ibmvscsi_handle_crq()
1150 */
1151 static void login_rsp(struct srp_event_struct *evt_struct)
1152 {
1153         struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1154         switch (evt_struct->xfer_iu->srp.login_rsp.opcode) {
1155         case SRP_LOGIN_RSP:     /* it worked! */
1156                 break;
1157         case SRP_LOGIN_REJ:     /* refused! */
1158                 dev_info(hostdata->dev, "SRP_LOGIN_REJ reason %u\n",
1159                          evt_struct->xfer_iu->srp.login_rej.reason);
1160                 /* Login failed.  */
1161                 atomic_set(&hostdata->request_limit, -1);
1162                 return;
1163         default:
1164                 dev_err(hostdata->dev, "Invalid login response typecode 0x%02x!\n",
1165                         evt_struct->xfer_iu->srp.login_rsp.opcode);
1166                 /* Login failed.  */
1167                 atomic_set(&hostdata->request_limit, -1);
1168                 return;
1169         }
1170
1171         dev_info(hostdata->dev, "SRP_LOGIN succeeded\n");
1172         hostdata->client_migrated = 0;
1173
1174         /* Now we know what the real request-limit is.
1175          * This value is set rather than added to request_limit because
1176          * request_limit could have been set to -1 by this client.
1177          */
1178         atomic_set(&hostdata->request_limit,
1179                    be32_to_cpu(evt_struct->xfer_iu->srp.login_rsp.req_lim_delta));
1180
1181         /* If we had any pending I/Os, kick them */
1182         scsi_unblock_requests(hostdata->host);
1183 }
1184
1185 /**
1186  * send_srp_login: - Sends the srp login
1187  * @hostdata:   ibmvscsi_host_data of host
1188  *
1189  * Returns zero if successful.
1190 */
1191 static int send_srp_login(struct ibmvscsi_host_data *hostdata)
1192 {
1193         int rc;
1194         unsigned long flags;
1195         struct srp_login_req *login;
1196         struct srp_event_struct *evt_struct = get_event_struct(&hostdata->pool);
1197
1198         BUG_ON(!evt_struct);
1199         init_event_struct(evt_struct, login_rsp,
1200                           VIOSRP_SRP_FORMAT, login_timeout);
1201
1202         login = &evt_struct->iu.srp.login_req;
1203         memset(login, 0, sizeof(*login));
1204         login->opcode = SRP_LOGIN_REQ;
1205         login->req_it_iu_len = cpu_to_be32(sizeof(union srp_iu));
1206         login->req_buf_fmt = cpu_to_be16(SRP_BUF_FORMAT_DIRECT |
1207                                          SRP_BUF_FORMAT_INDIRECT);
1208
1209         spin_lock_irqsave(hostdata->host->host_lock, flags);
1210         /* Start out with a request limit of 0, since this is negotiated in
1211          * the login request we are just sending and login requests always
1212          * get sent by the driver regardless of request_limit.
1213          */
1214         atomic_set(&hostdata->request_limit, 0);
1215
1216         rc = ibmvscsi_send_srp_event(evt_struct, hostdata, login_timeout * 2);
1217         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1218         dev_info(hostdata->dev, "sent SRP login\n");
1219         return rc;
1220 };
1221
1222 /**
1223  * capabilities_rsp: - Handle response to MAD adapter capabilities request
1224  * @evt_struct: srp_event_struct with the response
1225  *
1226  * Used as a "done" callback by when sending adapter_info.
1227  */
1228 static void capabilities_rsp(struct srp_event_struct *evt_struct)
1229 {
1230         struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1231
1232         if (evt_struct->xfer_iu->mad.capabilities.common.status) {
1233                 dev_err(hostdata->dev, "error 0x%X getting capabilities info\n",
1234                         evt_struct->xfer_iu->mad.capabilities.common.status);
1235         } else {
1236                 if (hostdata->caps.migration.common.server_support !=
1237                     cpu_to_be16(SERVER_SUPPORTS_CAP))
1238                         dev_info(hostdata->dev, "Partition migration not supported\n");
1239
1240                 if (client_reserve) {
1241                         if (hostdata->caps.reserve.common.server_support ==
1242                             cpu_to_be16(SERVER_SUPPORTS_CAP))
1243                                 dev_info(hostdata->dev, "Client reserve enabled\n");
1244                         else
1245                                 dev_info(hostdata->dev, "Client reserve not supported\n");
1246                 }
1247         }
1248
1249         send_srp_login(hostdata);
1250 }
1251
1252 /**
1253  * send_mad_capabilities: - Sends the mad capabilities request
1254  *      and stores the result so it can be retrieved with
1255  * @hostdata:   ibmvscsi_host_data of host
1256  */
1257 static void send_mad_capabilities(struct ibmvscsi_host_data *hostdata)
1258 {
1259         struct viosrp_capabilities *req;
1260         struct srp_event_struct *evt_struct;
1261         unsigned long flags;
1262         struct device_node *of_node = hostdata->dev->of_node;
1263         const char *location;
1264
1265         evt_struct = get_event_struct(&hostdata->pool);
1266         BUG_ON(!evt_struct);
1267
1268         init_event_struct(evt_struct, capabilities_rsp,
1269                           VIOSRP_MAD_FORMAT, info_timeout);
1270
1271         req = &evt_struct->iu.mad.capabilities;
1272         memset(req, 0, sizeof(*req));
1273
1274         hostdata->caps.flags = cpu_to_be32(CAP_LIST_SUPPORTED);
1275         if (hostdata->client_migrated)
1276                 hostdata->caps.flags |= cpu_to_be32(CLIENT_MIGRATED);
1277
1278         strlcpy(hostdata->caps.name, dev_name(&hostdata->host->shost_gendev),
1279                 sizeof(hostdata->caps.name));
1280
1281         location = of_get_property(of_node, "ibm,loc-code", NULL);
1282         location = location ? location : dev_name(hostdata->dev);
1283         strlcpy(hostdata->caps.loc, location, sizeof(hostdata->caps.loc));
1284
1285         req->common.type = cpu_to_be32(VIOSRP_CAPABILITIES_TYPE);
1286         req->buffer = cpu_to_be64(hostdata->caps_addr);
1287
1288         hostdata->caps.migration.common.cap_type =
1289                                 cpu_to_be32(MIGRATION_CAPABILITIES);
1290         hostdata->caps.migration.common.length =
1291                                 cpu_to_be16(sizeof(hostdata->caps.migration));
1292         hostdata->caps.migration.common.server_support =
1293                                 cpu_to_be16(SERVER_SUPPORTS_CAP);
1294         hostdata->caps.migration.ecl = cpu_to_be32(1);
1295
1296         if (client_reserve) {
1297                 hostdata->caps.reserve.common.cap_type =
1298                                         cpu_to_be32(RESERVATION_CAPABILITIES);
1299                 hostdata->caps.reserve.common.length =
1300                                 cpu_to_be16(sizeof(hostdata->caps.reserve));
1301                 hostdata->caps.reserve.common.server_support =
1302                                 cpu_to_be16(SERVER_SUPPORTS_CAP);
1303                 hostdata->caps.reserve.type =
1304                                 cpu_to_be32(CLIENT_RESERVE_SCSI_2);
1305                 req->common.length =
1306                                 cpu_to_be16(sizeof(hostdata->caps));
1307         } else
1308                 req->common.length = cpu_to_be16(sizeof(hostdata->caps) -
1309                                                 sizeof(hostdata->caps.reserve));
1310
1311         spin_lock_irqsave(hostdata->host->host_lock, flags);
1312         if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1313                 dev_err(hostdata->dev, "couldn't send CAPABILITIES_REQ!\n");
1314         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1315 };
1316
1317 /**
1318  * fast_fail_rsp: - Handle response to MAD enable fast fail
1319  * @evt_struct: srp_event_struct with the response
1320  *
1321  * Used as a "done" callback by when sending enable fast fail. Gets called
1322  * by ibmvscsi_handle_crq()
1323  */
1324 static void fast_fail_rsp(struct srp_event_struct *evt_struct)
1325 {
1326         struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1327         u16 status = be16_to_cpu(evt_struct->xfer_iu->mad.fast_fail.common.status);
1328
1329         if (status == VIOSRP_MAD_NOT_SUPPORTED)
1330                 dev_err(hostdata->dev, "fast_fail not supported in server\n");
1331         else if (status == VIOSRP_MAD_FAILED)
1332                 dev_err(hostdata->dev, "fast_fail request failed\n");
1333         else if (status != VIOSRP_MAD_SUCCESS)
1334                 dev_err(hostdata->dev, "error 0x%X enabling fast_fail\n", status);
1335
1336         send_mad_capabilities(hostdata);
1337 }
1338
1339 /**
1340  * init_host - Start host initialization
1341  * @hostdata:   ibmvscsi_host_data of host
1342  *
1343  * Returns zero if successful.
1344  */
1345 static int enable_fast_fail(struct ibmvscsi_host_data *hostdata)
1346 {
1347         int rc;
1348         unsigned long flags;
1349         struct viosrp_fast_fail *fast_fail_mad;
1350         struct srp_event_struct *evt_struct;
1351
1352         if (!fast_fail) {
1353                 send_mad_capabilities(hostdata);
1354                 return 0;
1355         }
1356
1357         evt_struct = get_event_struct(&hostdata->pool);
1358         BUG_ON(!evt_struct);
1359
1360         init_event_struct(evt_struct, fast_fail_rsp, VIOSRP_MAD_FORMAT, info_timeout);
1361
1362         fast_fail_mad = &evt_struct->iu.mad.fast_fail;
1363         memset(fast_fail_mad, 0, sizeof(*fast_fail_mad));
1364         fast_fail_mad->common.type = cpu_to_be32(VIOSRP_ENABLE_FAST_FAIL);
1365         fast_fail_mad->common.length = cpu_to_be16(sizeof(*fast_fail_mad));
1366
1367         spin_lock_irqsave(hostdata->host->host_lock, flags);
1368         rc = ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2);
1369         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1370         return rc;
1371 }
1372
1373 /**
1374  * adapter_info_rsp: - Handle response to MAD adapter info request
1375  * @evt_struct: srp_event_struct with the response
1376  *
1377  * Used as a "done" callback by when sending adapter_info. Gets called
1378  * by ibmvscsi_handle_crq()
1379 */
1380 static void adapter_info_rsp(struct srp_event_struct *evt_struct)
1381 {
1382         struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1383
1384         if (evt_struct->xfer_iu->mad.adapter_info.common.status) {
1385                 dev_err(hostdata->dev, "error %d getting adapter info\n",
1386                         evt_struct->xfer_iu->mad.adapter_info.common.status);
1387         } else {
1388                 dev_info(hostdata->dev, "host srp version: %s, "
1389                          "host partition %s (%d), OS %d, max io %u\n",
1390                          hostdata->madapter_info.srp_version,
1391                          hostdata->madapter_info.partition_name,
1392                          be32_to_cpu(hostdata->madapter_info.partition_number),
1393                          be32_to_cpu(hostdata->madapter_info.os_type),
1394                          be32_to_cpu(hostdata->madapter_info.port_max_txu[0]));
1395                 
1396                 if (hostdata->madapter_info.port_max_txu[0]) 
1397                         hostdata->host->max_sectors = 
1398                                 be32_to_cpu(hostdata->madapter_info.port_max_txu[0]) >> 9;
1399                 
1400                 if (be32_to_cpu(hostdata->madapter_info.os_type) == SRP_MAD_OS_AIX &&
1401                     strcmp(hostdata->madapter_info.srp_version, "1.6a") <= 0) {
1402                         dev_err(hostdata->dev, "host (Ver. %s) doesn't support large transfers\n",
1403                                 hostdata->madapter_info.srp_version);
1404                         dev_err(hostdata->dev, "limiting scatterlists to %d\n",
1405                                 MAX_INDIRECT_BUFS);
1406                         hostdata->host->sg_tablesize = MAX_INDIRECT_BUFS;
1407                 }
1408
1409                 if (be32_to_cpu(hostdata->madapter_info.os_type) == SRP_MAD_OS_AIX) {
1410                         enable_fast_fail(hostdata);
1411                         return;
1412                 }
1413         }
1414
1415         send_srp_login(hostdata);
1416 }
1417
1418 /**
1419  * send_mad_adapter_info: - Sends the mad adapter info request
1420  *      and stores the result so it can be retrieved with
1421  *      sysfs.  We COULD consider causing a failure if the
1422  *      returned SRP version doesn't match ours.
1423  * @hostdata:   ibmvscsi_host_data of host
1424  * 
1425  * Returns zero if successful.
1426 */
1427 static void send_mad_adapter_info(struct ibmvscsi_host_data *hostdata)
1428 {
1429         struct viosrp_adapter_info *req;
1430         struct srp_event_struct *evt_struct;
1431         unsigned long flags;
1432
1433         evt_struct = get_event_struct(&hostdata->pool);
1434         BUG_ON(!evt_struct);
1435
1436         init_event_struct(evt_struct,
1437                           adapter_info_rsp,
1438                           VIOSRP_MAD_FORMAT,
1439                           info_timeout);
1440         
1441         req = &evt_struct->iu.mad.adapter_info;
1442         memset(req, 0x00, sizeof(*req));
1443         
1444         req->common.type = cpu_to_be32(VIOSRP_ADAPTER_INFO_TYPE);
1445         req->common.length = cpu_to_be16(sizeof(hostdata->madapter_info));
1446         req->buffer = cpu_to_be64(hostdata->adapter_info_addr);
1447
1448         spin_lock_irqsave(hostdata->host->host_lock, flags);
1449         if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1450                 dev_err(hostdata->dev, "couldn't send ADAPTER_INFO_REQ!\n");
1451         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1452 };
1453
/**
 * init_adapter: Start virtual adapter initialization sequence
 * @hostdata:	ibmvscsi_host_data of host
 *
 * The sequence begins with the MAD adapter info request.
 */
static void init_adapter(struct ibmvscsi_host_data *hostdata)
{
	send_mad_adapter_info(hostdata);
}
1462
1463 /**
1464  * sync_completion: Signal that a synchronous command has completed
1465  * Note that after returning from this call, the evt_struct is freed.
1466  * the caller waiting on this completion shouldn't touch the evt_struct
1467  * again.
1468  */
1469 static void sync_completion(struct srp_event_struct *evt_struct)
1470 {
1471         /* copy the response back */
1472         if (evt_struct->sync_srp)
1473                 *evt_struct->sync_srp = *evt_struct->xfer_iu;
1474         
1475         complete(&evt_struct->comp);
1476 }
1477
1478 /**
1479  * ibmvscsi_abort: Abort a command...from scsi host template
1480  * send this over to the server and wait synchronously for the response
1481  */
1482 static int ibmvscsi_eh_abort_handler(struct scsi_cmnd *cmd)
1483 {
1484         struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1485         struct srp_tsk_mgmt *tsk_mgmt;
1486         struct srp_event_struct *evt;
1487         struct srp_event_struct *tmp_evt, *found_evt;
1488         union viosrp_iu srp_rsp;
1489         int rsp_rc;
1490         unsigned long flags;
1491         u16 lun = lun_from_dev(cmd->device);
1492         unsigned long wait_switch = 0;
1493
1494         /* First, find this command in our sent list so we can figure
1495          * out the correct tag
1496          */
1497         spin_lock_irqsave(hostdata->host->host_lock, flags);
1498         wait_switch = jiffies + (init_timeout * HZ);
1499         do {
1500                 found_evt = NULL;
1501                 list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1502                         if (tmp_evt->cmnd == cmd) {
1503                                 found_evt = tmp_evt;
1504                                 break;
1505                         }
1506                 }
1507
1508                 if (!found_evt) {
1509                         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1510                         return SUCCESS;
1511                 }
1512
1513                 evt = get_event_struct(&hostdata->pool);
1514                 if (evt == NULL) {
1515                         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1516                         sdev_printk(KERN_ERR, cmd->device,
1517                                 "failed to allocate abort event\n");
1518                         return FAILED;
1519                 }
1520         
1521                 init_event_struct(evt,
1522                                   sync_completion,
1523                                   VIOSRP_SRP_FORMAT,
1524                                   abort_timeout);
1525
1526                 tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1527         
1528                 /* Set up an abort SRP command */
1529                 memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1530                 tsk_mgmt->opcode = SRP_TSK_MGMT;
1531                 int_to_scsilun(lun, &tsk_mgmt->lun);
1532                 tsk_mgmt->tsk_mgmt_func = SRP_TSK_ABORT_TASK;
1533                 tsk_mgmt->task_tag = (u64) found_evt;
1534
1535                 evt->sync_srp = &srp_rsp;
1536
1537                 init_completion(&evt->comp);
1538                 rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, abort_timeout * 2);
1539
1540                 if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1541                         break;
1542
1543                 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1544                 msleep(10);
1545                 spin_lock_irqsave(hostdata->host->host_lock, flags);
1546         } while (time_before(jiffies, wait_switch));
1547
1548         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1549
1550         if (rsp_rc != 0) {
1551                 sdev_printk(KERN_ERR, cmd->device,
1552                             "failed to send abort() event. rc=%d\n", rsp_rc);
1553                 return FAILED;
1554         }
1555
1556         sdev_printk(KERN_INFO, cmd->device,
1557                     "aborting command. lun 0x%llx, tag 0x%llx\n",
1558                     (((u64) lun) << 48), (u64) found_evt);
1559
1560         wait_for_completion(&evt->comp);
1561
1562         /* make sure we got a good response */
1563         if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1564                 if (printk_ratelimit())
1565                         sdev_printk(KERN_WARNING, cmd->device, "abort bad SRP RSP type %d\n",
1566                                     srp_rsp.srp.rsp.opcode);
1567                 return FAILED;
1568         }
1569
1570         if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1571                 rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1572         else
1573                 rsp_rc = srp_rsp.srp.rsp.status;
1574
1575         if (rsp_rc) {
1576                 if (printk_ratelimit())
1577                         sdev_printk(KERN_WARNING, cmd->device,
1578                                     "abort code %d for task tag 0x%llx\n",
1579                                     rsp_rc, tsk_mgmt->task_tag);
1580                 return FAILED;
1581         }
1582
1583         /* Because we dropped the spinlock above, it's possible
1584          * The event is no longer in our list.  Make sure it didn't
1585          * complete while we were aborting
1586          */
1587         spin_lock_irqsave(hostdata->host->host_lock, flags);
1588         found_evt = NULL;
1589         list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1590                 if (tmp_evt->cmnd == cmd) {
1591                         found_evt = tmp_evt;
1592                         break;
1593                 }
1594         }
1595
1596         if (found_evt == NULL) {
1597                 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1598                 sdev_printk(KERN_INFO, cmd->device, "aborted task tag 0x%llx completed\n",
1599                             tsk_mgmt->task_tag);
1600                 return SUCCESS;
1601         }
1602
1603         sdev_printk(KERN_INFO, cmd->device, "successfully aborted task tag 0x%llx\n",
1604                     tsk_mgmt->task_tag);
1605
1606         cmd->result = (DID_ABORT << 16);
1607         list_del(&found_evt->list);
1608         unmap_cmd_data(&found_evt->iu.srp.cmd, found_evt,
1609                        found_evt->hostdata->dev);
1610         free_event_struct(&found_evt->hostdata->pool, found_evt);
1611         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1612         atomic_inc(&hostdata->request_limit);
1613         return SUCCESS;
1614 }
1615
1616 /**
1617  * ibmvscsi_eh_device_reset_handler: Reset a single LUN...from scsi host 
1618  * template send this over to the server and wait synchronously for the 
1619  * response
1620  */
1621 static int ibmvscsi_eh_device_reset_handler(struct scsi_cmnd *cmd)
1622 {
1623         struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1624         struct srp_tsk_mgmt *tsk_mgmt;
1625         struct srp_event_struct *evt;
1626         struct srp_event_struct *tmp_evt, *pos;
1627         union viosrp_iu srp_rsp;
1628         int rsp_rc;
1629         unsigned long flags;
1630         u16 lun = lun_from_dev(cmd->device);
1631         unsigned long wait_switch = 0;
1632
1633         spin_lock_irqsave(hostdata->host->host_lock, flags);
1634         wait_switch = jiffies + (init_timeout * HZ);
1635         do {
1636                 evt = get_event_struct(&hostdata->pool);
1637                 if (evt == NULL) {
1638                         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1639                         sdev_printk(KERN_ERR, cmd->device,
1640                                 "failed to allocate reset event\n");
1641                         return FAILED;
1642                 }
1643         
1644                 init_event_struct(evt,
1645                                   sync_completion,
1646                                   VIOSRP_SRP_FORMAT,
1647                                   reset_timeout);
1648
1649                 tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1650
1651                 /* Set up a lun reset SRP command */
1652                 memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1653                 tsk_mgmt->opcode = SRP_TSK_MGMT;
1654                 int_to_scsilun(lun, &tsk_mgmt->lun);
1655                 tsk_mgmt->tsk_mgmt_func = SRP_TSK_LUN_RESET;
1656
1657                 evt->sync_srp = &srp_rsp;
1658
1659                 init_completion(&evt->comp);
1660                 rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, reset_timeout * 2);
1661
1662                 if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1663                         break;
1664
1665                 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1666                 msleep(10);
1667                 spin_lock_irqsave(hostdata->host->host_lock, flags);
1668         } while (time_before(jiffies, wait_switch));
1669
1670         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1671
1672         if (rsp_rc != 0) {
1673                 sdev_printk(KERN_ERR, cmd->device,
1674                             "failed to send reset event. rc=%d\n", rsp_rc);
1675                 return FAILED;
1676         }
1677
1678         sdev_printk(KERN_INFO, cmd->device, "resetting device. lun 0x%llx\n",
1679                     (((u64) lun) << 48));
1680
1681         wait_for_completion(&evt->comp);
1682
1683         /* make sure we got a good response */
1684         if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1685                 if (printk_ratelimit())
1686                         sdev_printk(KERN_WARNING, cmd->device, "reset bad SRP RSP type %d\n",
1687                                     srp_rsp.srp.rsp.opcode);
1688                 return FAILED;
1689         }
1690
1691         if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1692                 rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1693         else
1694                 rsp_rc = srp_rsp.srp.rsp.status;
1695
1696         if (rsp_rc) {
1697                 if (printk_ratelimit())
1698                         sdev_printk(KERN_WARNING, cmd->device,
1699                                     "reset code %d for task tag 0x%llx\n",
1700                                     rsp_rc, tsk_mgmt->task_tag);
1701                 return FAILED;
1702         }
1703
1704         /* We need to find all commands for this LUN that have not yet been
1705          * responded to, and fail them with DID_RESET
1706          */
1707         spin_lock_irqsave(hostdata->host->host_lock, flags);
1708         list_for_each_entry_safe(tmp_evt, pos, &hostdata->sent, list) {
1709                 if ((tmp_evt->cmnd) && (tmp_evt->cmnd->device == cmd->device)) {
1710                         if (tmp_evt->cmnd)
1711                                 tmp_evt->cmnd->result = (DID_RESET << 16);
1712                         list_del(&tmp_evt->list);
1713                         unmap_cmd_data(&tmp_evt->iu.srp.cmd, tmp_evt,
1714                                        tmp_evt->hostdata->dev);
1715                         free_event_struct(&tmp_evt->hostdata->pool,
1716                                                    tmp_evt);
1717                         atomic_inc(&hostdata->request_limit);
1718                         if (tmp_evt->cmnd_done)
1719                                 tmp_evt->cmnd_done(tmp_evt->cmnd);
1720                         else if (tmp_evt->done)
1721                                 tmp_evt->done(tmp_evt);
1722                 }
1723         }
1724         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1725         return SUCCESS;
1726 }
1727
1728 /**
1729  * ibmvscsi_eh_host_reset_handler - Reset the connection to the server
1730  * @cmd:        struct scsi_cmnd having problems
1731 */
1732 static int ibmvscsi_eh_host_reset_handler(struct scsi_cmnd *cmd)
1733 {
1734         unsigned long wait_switch = 0;
1735         struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1736
1737         dev_err(hostdata->dev, "Resetting connection due to error recovery\n");
1738
1739         ibmvscsi_reset_host(hostdata);
1740
1741         for (wait_switch = jiffies + (init_timeout * HZ);
1742              time_before(jiffies, wait_switch) &&
1743                      atomic_read(&hostdata->request_limit) < 2;) {
1744
1745                 msleep(10);
1746         }
1747
1748         if (atomic_read(&hostdata->request_limit) <= 0)
1749                 return FAILED;
1750
1751         return SUCCESS;
1752 }
1753
1754 /**
1755  * ibmvscsi_handle_crq: - Handles and frees received events in the CRQ
1756  * @crq:        Command/Response queue
1757  * @hostdata:   ibmvscsi_host_data of host
1758  *
1759 */
1760 static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
1761                                 struct ibmvscsi_host_data *hostdata)
1762 {
1763         long rc;
1764         unsigned long flags;
1765         /* The hypervisor copies our tag value here so no byteswapping */
1766         struct srp_event_struct *evt_struct =
1767                         (__force struct srp_event_struct *)crq->IU_data_ptr;
1768         switch (crq->valid) {
1769         case VIOSRP_CRQ_INIT_RSP:               /* initialization */
1770                 switch (crq->format) {
1771                 case VIOSRP_CRQ_INIT:   /* Initialization message */
1772                         dev_info(hostdata->dev, "partner initialized\n");
1773                         /* Send back a response */
1774                         rc = ibmvscsi_send_crq(hostdata, 0xC002000000000000LL, 0);
1775                         if (rc == 0) {
1776                                 /* Now login */
1777                                 init_adapter(hostdata);
1778                         } else {
1779                                 dev_err(hostdata->dev, "Unable to send init rsp. rc=%ld\n", rc);
1780                         }
1781
1782                         break;
1783                 case VIOSRP_CRQ_INIT_COMPLETE:  /* Initialization response */
1784                         dev_info(hostdata->dev, "partner initialization complete\n");
1785
1786                         /* Now login */
1787                         init_adapter(hostdata);
1788                         break;
1789                 default:
1790                         dev_err(hostdata->dev, "unknown crq message type: %d\n", crq->format);
1791                 }
1792                 return;
1793         case VIOSRP_CRQ_XPORT_EVENT:    /* Hypervisor telling us the connection is closed */
1794                 scsi_block_requests(hostdata->host);
1795                 atomic_set(&hostdata->request_limit, 0);
1796                 if (crq->format == 0x06) {
1797                         /* We need to re-setup the interpartition connection */
1798                         dev_info(hostdata->dev, "Re-enabling adapter!\n");
1799                         hostdata->client_migrated = 1;
1800                         hostdata->reenable_crq = 1;
1801                         purge_requests(hostdata, DID_REQUEUE);
1802                         wake_up(&hostdata->work_wait_q);
1803                 } else {
1804                         dev_err(hostdata->dev, "Virtual adapter failed rc %d!\n",
1805                                 crq->format);
1806                         ibmvscsi_reset_host(hostdata);
1807                 }
1808                 return;
1809         case VIOSRP_CRQ_CMD_RSP:                /* real payload */
1810                 break;
1811         default:
1812                 dev_err(hostdata->dev, "got an invalid message type 0x%02x\n",
1813                         crq->valid);
1814                 return;
1815         }
1816
1817         /* The only kind of payload CRQs we should get are responses to
1818          * things we send. Make sure this response is to something we
1819          * actually sent
1820          */
1821         if (!valid_event_struct(&hostdata->pool, evt_struct)) {
1822                 dev_err(hostdata->dev, "returned correlation_token 0x%p is invalid!\n",
1823                        evt_struct);
1824                 return;
1825         }
1826
1827         if (atomic_read(&evt_struct->free)) {
1828                 dev_err(hostdata->dev, "received duplicate correlation_token 0x%p!\n",
1829                         evt_struct);
1830                 return;
1831         }
1832
1833         if (crq->format == VIOSRP_SRP_FORMAT)
1834                 atomic_add(be32_to_cpu(evt_struct->xfer_iu->srp.rsp.req_lim_delta),
1835                            &hostdata->request_limit);
1836
1837         del_timer(&evt_struct->timer);
1838
1839         if ((crq->status != VIOSRP_OK && crq->status != VIOSRP_OK2) && evt_struct->cmnd)
1840                 evt_struct->cmnd->result = DID_ERROR << 16;
1841         if (evt_struct->done)
1842                 evt_struct->done(evt_struct);
1843         else
1844                 dev_err(hostdata->dev, "returned done() is NULL; not running it!\n");
1845
1846         /*
1847          * Lock the host_lock before messing with these structures, since we
1848          * are running in a task context
1849          */
1850         spin_lock_irqsave(evt_struct->hostdata->host->host_lock, flags);
1851         list_del(&evt_struct->list);
1852         free_event_struct(&evt_struct->hostdata->pool, evt_struct);
1853         spin_unlock_irqrestore(evt_struct->hostdata->host->host_lock, flags);
1854 }
1855
1856 /**
1857  * ibmvscsi_slave_configure: Set the "allow_restart" flag for each disk.
1858  * @sdev:       struct scsi_device device to configure
1859  *
1860  * Enable allow_restart for a device if it is a disk.  Adjust the
1861  * queue_depth here also as is required by the documentation for
1862  * struct scsi_host_template.
1863  */
1864 static int ibmvscsi_slave_configure(struct scsi_device *sdev)
1865 {
1866         struct Scsi_Host *shost = sdev->host;
1867         unsigned long lock_flags = 0;
1868
1869         spin_lock_irqsave(shost->host_lock, lock_flags);
1870         if (sdev->type == TYPE_DISK) {
1871                 sdev->allow_restart = 1;
1872                 blk_queue_rq_timeout(sdev->request_queue, 120 * HZ);
1873         }
1874         spin_unlock_irqrestore(shost->host_lock, lock_flags);
1875         return 0;
1876 }
1877
1878 /**
1879  * ibmvscsi_change_queue_depth - Change the device's queue depth
1880  * @sdev:       scsi device struct
1881  * @qdepth:     depth to set
1882  * @reason:     calling context
1883  *
1884  * Return value:
1885  *      actual depth set
1886  **/
1887 static int ibmvscsi_change_queue_depth(struct scsi_device *sdev, int qdepth)
1888 {
1889         if (qdepth > IBMVSCSI_MAX_CMDS_PER_LUN)
1890                 qdepth = IBMVSCSI_MAX_CMDS_PER_LUN;
1891         return scsi_change_queue_depth(sdev, qdepth);
1892 }
1893
1894 /* ------------------------------------------------------------
1895  * sysfs attributes
1896  */
1897 static ssize_t show_host_vhost_loc(struct device *dev,
1898                                    struct device_attribute *attr, char *buf)
1899 {
1900         struct Scsi_Host *shost = class_to_shost(dev);
1901         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1902         int len;
1903
1904         len = snprintf(buf, sizeof(hostdata->caps.loc), "%s\n",
1905                        hostdata->caps.loc);
1906         return len;
1907 }
1908
1909 static struct device_attribute ibmvscsi_host_vhost_loc = {
1910         .attr = {
1911                  .name = "vhost_loc",
1912                  .mode = S_IRUGO,
1913                  },
1914         .show = show_host_vhost_loc,
1915 };
1916
1917 static ssize_t show_host_vhost_name(struct device *dev,
1918                                     struct device_attribute *attr, char *buf)
1919 {
1920         struct Scsi_Host *shost = class_to_shost(dev);
1921         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1922         int len;
1923
1924         len = snprintf(buf, sizeof(hostdata->caps.name), "%s\n",
1925                        hostdata->caps.name);
1926         return len;
1927 }
1928
1929 static struct device_attribute ibmvscsi_host_vhost_name = {
1930         .attr = {
1931                  .name = "vhost_name",
1932                  .mode = S_IRUGO,
1933                  },
1934         .show = show_host_vhost_name,
1935 };
1936
1937 static ssize_t show_host_srp_version(struct device *dev,
1938                                      struct device_attribute *attr, char *buf)
1939 {
1940         struct Scsi_Host *shost = class_to_shost(dev);
1941         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1942         int len;
1943
1944         len = snprintf(buf, PAGE_SIZE, "%s\n",
1945                        hostdata->madapter_info.srp_version);
1946         return len;
1947 }
1948
1949 static struct device_attribute ibmvscsi_host_srp_version = {
1950         .attr = {
1951                  .name = "srp_version",
1952                  .mode = S_IRUGO,
1953                  },
1954         .show = show_host_srp_version,
1955 };
1956
1957 static ssize_t show_host_partition_name(struct device *dev,
1958                                         struct device_attribute *attr,
1959                                         char *buf)
1960 {
1961         struct Scsi_Host *shost = class_to_shost(dev);
1962         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1963         int len;
1964
1965         len = snprintf(buf, PAGE_SIZE, "%s\n",
1966                        hostdata->madapter_info.partition_name);
1967         return len;
1968 }
1969
1970 static struct device_attribute ibmvscsi_host_partition_name = {
1971         .attr = {
1972                  .name = "partition_name",
1973                  .mode = S_IRUGO,
1974                  },
1975         .show = show_host_partition_name,
1976 };
1977
1978 static ssize_t show_host_partition_number(struct device *dev,
1979                                           struct device_attribute *attr,
1980                                           char *buf)
1981 {
1982         struct Scsi_Host *shost = class_to_shost(dev);
1983         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1984         int len;
1985
1986         len = snprintf(buf, PAGE_SIZE, "%d\n",
1987                        be32_to_cpu(hostdata->madapter_info.partition_number));
1988         return len;
1989 }
1990
1991 static struct device_attribute ibmvscsi_host_partition_number = {
1992         .attr = {
1993                  .name = "partition_number",
1994                  .mode = S_IRUGO,
1995                  },
1996         .show = show_host_partition_number,
1997 };
1998
1999 static ssize_t show_host_mad_version(struct device *dev,
2000                                      struct device_attribute *attr, char *buf)
2001 {
2002         struct Scsi_Host *shost = class_to_shost(dev);
2003         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2004         int len;
2005
2006         len = snprintf(buf, PAGE_SIZE, "%d\n",
2007                        be32_to_cpu(hostdata->madapter_info.mad_version));
2008         return len;
2009 }
2010
2011 static struct device_attribute ibmvscsi_host_mad_version = {
2012         .attr = {
2013                  .name = "mad_version",
2014                  .mode = S_IRUGO,
2015                  },
2016         .show = show_host_mad_version,
2017 };
2018
2019 static ssize_t show_host_os_type(struct device *dev,
2020                                  struct device_attribute *attr, char *buf)
2021 {
2022         struct Scsi_Host *shost = class_to_shost(dev);
2023         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2024         int len;
2025
2026         len = snprintf(buf, PAGE_SIZE, "%d\n",
2027                        be32_to_cpu(hostdata->madapter_info.os_type));
2028         return len;
2029 }
2030
2031 static struct device_attribute ibmvscsi_host_os_type = {
2032         .attr = {
2033                  .name = "os_type",
2034                  .mode = S_IRUGO,
2035                  },
2036         .show = show_host_os_type,
2037 };
2038
2039 static ssize_t show_host_config(struct device *dev,
2040                                 struct device_attribute *attr, char *buf)
2041 {
2042         return 0;
2043 }
2044
2045 static struct device_attribute ibmvscsi_host_config = {
2046         .attr = {
2047                 .name = "config",
2048                 .mode = S_IRUGO,
2049                 },
2050         .show = show_host_config,
2051 };
2052
2053 static struct device_attribute *ibmvscsi_attrs[] = {
2054         &ibmvscsi_host_vhost_loc,
2055         &ibmvscsi_host_vhost_name,
2056         &ibmvscsi_host_srp_version,
2057         &ibmvscsi_host_partition_name,
2058         &ibmvscsi_host_partition_number,
2059         &ibmvscsi_host_mad_version,
2060         &ibmvscsi_host_os_type,
2061         &ibmvscsi_host_config,
2062         NULL
2063 };
2064
2065 /* ------------------------------------------------------------
2066  * SCSI driver registration
2067  */
2068 static struct scsi_host_template driver_template = {
2069         .module = THIS_MODULE,
2070         .name = "IBM POWER Virtual SCSI Adapter " IBMVSCSI_VERSION,
2071         .proc_name = "ibmvscsi",
2072         .queuecommand = ibmvscsi_queuecommand,
2073         .eh_timed_out = srp_timed_out,
2074         .eh_abort_handler = ibmvscsi_eh_abort_handler,
2075         .eh_device_reset_handler = ibmvscsi_eh_device_reset_handler,
2076         .eh_host_reset_handler = ibmvscsi_eh_host_reset_handler,
2077         .slave_configure = ibmvscsi_slave_configure,
2078         .change_queue_depth = ibmvscsi_change_queue_depth,
2079         .cmd_per_lun = IBMVSCSI_CMDS_PER_LUN_DEFAULT,
2080         .can_queue = IBMVSCSI_MAX_REQUESTS_DEFAULT,
2081         .this_id = -1,
2082         .sg_tablesize = SG_ALL,
2083         .shost_attrs = ibmvscsi_attrs,
2084 };
2085
2086 /**
2087  * ibmvscsi_get_desired_dma - Calculate IO memory desired by the driver
2088  *
2089  * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
2090  *
2091  * Return value:
2092  *      Number of bytes of IO data the driver will need to perform well.
2093  */
2094 static unsigned long ibmvscsi_get_desired_dma(struct vio_dev *vdev)
2095 {
2096         /* iu_storage data allocated in initialize_event_pool */
2097         unsigned long desired_io = max_events * sizeof(union viosrp_iu);
2098
2099         /* add io space for sg data */
2100         desired_io += (IBMVSCSI_MAX_SECTORS_DEFAULT * 512 *
2101                              IBMVSCSI_CMDS_PER_LUN_DEFAULT);
2102
2103         return desired_io;
2104 }
2105
2106 static void ibmvscsi_do_work(struct ibmvscsi_host_data *hostdata)
2107 {
2108         int rc;
2109         char *action = "reset";
2110
2111         if (hostdata->reset_crq) {
2112                 smp_rmb();
2113                 hostdata->reset_crq = 0;
2114
2115                 rc = ibmvscsi_reset_crq_queue(&hostdata->queue, hostdata);
2116                 if (!rc)
2117                         rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
2118                 vio_enable_interrupts(to_vio_dev(hostdata->dev));
2119         } else if (hostdata->reenable_crq) {
2120                 smp_rmb();
2121                 action = "enable";
2122                 rc = ibmvscsi_reenable_crq_queue(&hostdata->queue, hostdata);
2123                 hostdata->reenable_crq = 0;
2124                 if (!rc)
2125                         rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
2126         } else
2127                 return;
2128
2129         if (rc) {
2130                 atomic_set(&hostdata->request_limit, -1);
2131                 dev_err(hostdata->dev, "error after %s\n", action);
2132         }
2133
2134         scsi_unblock_requests(hostdata->host);
2135 }
2136
2137 static int ibmvscsi_work_to_do(struct ibmvscsi_host_data *hostdata)
2138 {
2139         if (kthread_should_stop())
2140                 return 1;
2141         else if (hostdata->reset_crq) {
2142                 smp_rmb();
2143                 return 1;
2144         } else if (hostdata->reenable_crq) {
2145                 smp_rmb();
2146                 return 1;
2147         }
2148
2149         return 0;
2150 }
2151
2152 static int ibmvscsi_work(void *data)
2153 {
2154         struct ibmvscsi_host_data *hostdata = data;
2155         int rc;
2156
2157         set_user_nice(current, MIN_NICE);
2158
2159         while (1) {
2160                 rc = wait_event_interruptible(hostdata->work_wait_q,
2161                                               ibmvscsi_work_to_do(hostdata));
2162
2163                 BUG_ON(rc);
2164
2165                 if (kthread_should_stop())
2166                         break;
2167
2168                 ibmvscsi_do_work(hostdata);
2169         }
2170
2171         return 0;
2172 }
2173
2174 /**
2175  * Called by bus code for each adapter
2176  */
2177 static int ibmvscsi_probe(struct vio_dev *vdev, const struct vio_device_id *id)
2178 {
2179         struct ibmvscsi_host_data *hostdata;
2180         struct Scsi_Host *host;
2181         struct device *dev = &vdev->dev;
2182         struct srp_rport_identifiers ids;
2183         struct srp_rport *rport;
2184         unsigned long wait_switch = 0;
2185         int rc;
2186
2187         dev_set_drvdata(&vdev->dev, NULL);
2188
2189         host = scsi_host_alloc(&driver_template, sizeof(*hostdata));
2190         if (!host) {
2191                 dev_err(&vdev->dev, "couldn't allocate host data\n");
2192                 goto scsi_host_alloc_failed;
2193         }
2194
2195         host->transportt = ibmvscsi_transport_template;
2196         hostdata = shost_priv(host);
2197         memset(hostdata, 0x00, sizeof(*hostdata));
2198         INIT_LIST_HEAD(&hostdata->sent);
2199         init_waitqueue_head(&hostdata->work_wait_q);
2200         hostdata->host = host;
2201         hostdata->dev = dev;
2202         atomic_set(&hostdata->request_limit, -1);
2203         hostdata->host->max_sectors = IBMVSCSI_MAX_SECTORS_DEFAULT;
2204
2205         if (map_persist_bufs(hostdata)) {
2206                 dev_err(&vdev->dev, "couldn't map persistent buffers\n");
2207                 goto persist_bufs_failed;
2208         }
2209
2210         hostdata->work_thread = kthread_run(ibmvscsi_work, hostdata, "%s_%d",
2211                                             "ibmvscsi", host->host_no);
2212
2213         if (IS_ERR(hostdata->work_thread)) {
2214                 dev_err(&vdev->dev, "couldn't initialize kthread. rc=%ld\n",
2215                         PTR_ERR(hostdata->work_thread));
2216                 goto init_crq_failed;
2217         }
2218
2219         rc = ibmvscsi_init_crq_queue(&hostdata->queue, hostdata, max_events);
2220         if (rc != 0 && rc != H_RESOURCE) {
2221                 dev_err(&vdev->dev, "couldn't initialize crq. rc=%d\n", rc);
2222                 goto kill_kthread;
2223         }
2224         if (initialize_event_pool(&hostdata->pool, max_events, hostdata) != 0) {
2225                 dev_err(&vdev->dev, "couldn't initialize event pool\n");
2226                 goto init_pool_failed;
2227         }
2228
2229         host->max_lun = IBMVSCSI_MAX_LUN;
2230         host->max_id = max_id;
2231         host->max_channel = max_channel;
2232         host->max_cmd_len = 16;
2233
2234         dev_info(dev,
2235                  "Maximum ID: %d Maximum LUN: %llu Maximum Channel: %d\n",
2236                  host->max_id, host->max_lun, host->max_channel);
2237
2238         if (scsi_add_host(hostdata->host, hostdata->dev))
2239                 goto add_host_failed;
2240
2241         /* we don't have a proper target_port_id so let's use the fake one */
2242         memcpy(ids.port_id, hostdata->madapter_info.partition_name,
2243                sizeof(ids.port_id));
2244         ids.roles = SRP_RPORT_ROLE_TARGET;
2245         rport = srp_rport_add(host, &ids);
2246         if (IS_ERR(rport))
2247                 goto add_srp_port_failed;
2248
2249         /* Try to send an initialization message.  Note that this is allowed
2250          * to fail if the other end is not acive.  In that case we don't
2251          * want to scan
2252          */
2253         if (ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0) == 0
2254             || rc == H_RESOURCE) {
2255                 /*
2256                  * Wait around max init_timeout secs for the adapter to finish
2257                  * initializing. When we are done initializing, we will have a
2258                  * valid request_limit.  We don't want Linux scanning before
2259                  * we are ready.
2260                  */
2261                 for (wait_switch = jiffies + (init_timeout * HZ);
2262                      time_before(jiffies, wait_switch) &&
2263                      atomic_read(&hostdata->request_limit) < 2;) {
2264
2265                         msleep(10);
2266                 }
2267
2268                 /* if we now have a valid request_limit, initiate a scan */
2269                 if (atomic_read(&hostdata->request_limit) > 0)
2270                         scsi_scan_host(host);
2271         }
2272
2273         dev_set_drvdata(&vdev->dev, hostdata);
2274         spin_lock(&ibmvscsi_driver_lock);
2275         list_add_tail(&hostdata->host_list, &ibmvscsi_head);
2276         spin_unlock(&ibmvscsi_driver_lock);
2277         return 0;
2278
2279       add_srp_port_failed:
2280         scsi_remove_host(hostdata->host);
2281       add_host_failed:
2282         release_event_pool(&hostdata->pool, hostdata);
2283       init_pool_failed:
2284         ibmvscsi_release_crq_queue(&hostdata->queue, hostdata, max_events);
2285       kill_kthread:
2286       kthread_stop(hostdata->work_thread);
2287       init_crq_failed:
2288         unmap_persist_bufs(hostdata);
2289       persist_bufs_failed:
2290         scsi_host_put(host);
2291       scsi_host_alloc_failed:
2292         return -1;
2293 }
2294
2295 static int ibmvscsi_remove(struct vio_dev *vdev)
2296 {
2297         struct ibmvscsi_host_data *hostdata = dev_get_drvdata(&vdev->dev);
2298         unsigned long flags;
2299
2300         srp_remove_host(hostdata->host);
2301         scsi_remove_host(hostdata->host);
2302
2303         purge_requests(hostdata, DID_ERROR);
2304
2305         spin_lock_irqsave(hostdata->host->host_lock, flags);
2306         release_event_pool(&hostdata->pool, hostdata);
2307         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
2308
2309         ibmvscsi_release_crq_queue(&hostdata->queue, hostdata,
2310                                         max_events);
2311
2312         kthread_stop(hostdata->work_thread);
2313         unmap_persist_bufs(hostdata);
2314
2315         spin_lock(&ibmvscsi_driver_lock);
2316         list_del(&hostdata->host_list);
2317         spin_unlock(&ibmvscsi_driver_lock);
2318
2319         scsi_host_put(hostdata->host);
2320
2321         return 0;
2322 }
2323
2324 /**
2325  * ibmvscsi_resume: Resume from suspend
2326  * @dev:        device struct
2327  *
2328  * We may have lost an interrupt across suspend/resume, so kick the
2329  * interrupt handler
2330  */
2331 static int ibmvscsi_resume(struct device *dev)
2332 {
2333         struct ibmvscsi_host_data *hostdata = dev_get_drvdata(dev);
2334         vio_disable_interrupts(to_vio_dev(hostdata->dev));
2335         tasklet_schedule(&hostdata->srp_task);
2336
2337         return 0;
2338 }
2339
2340 /**
2341  * ibmvscsi_device_table: Used by vio.c to match devices in the device tree we 
2342  * support.
2343  */
2344 static const struct vio_device_id ibmvscsi_device_table[] = {
2345         {"vscsi", "IBM,v-scsi"},
2346         { "", "" }
2347 };
2348 MODULE_DEVICE_TABLE(vio, ibmvscsi_device_table);
2349
2350 static const struct dev_pm_ops ibmvscsi_pm_ops = {
2351         .resume = ibmvscsi_resume
2352 };
2353
2354 static struct vio_driver ibmvscsi_driver = {
2355         .id_table = ibmvscsi_device_table,
2356         .probe = ibmvscsi_probe,
2357         .remove = ibmvscsi_remove,
2358         .get_desired_dma = ibmvscsi_get_desired_dma,
2359         .name = "ibmvscsi",
2360         .pm = &ibmvscsi_pm_ops,
2361 };
2362
2363 static struct srp_function_template ibmvscsi_transport_functions = {
2364 };
2365
2366 int __init ibmvscsi_module_init(void)
2367 {
2368         int ret;
2369
2370         /* Ensure we have two requests to do error recovery */
2371         driver_template.can_queue = max_requests;
2372         max_events = max_requests + 2;
2373
2374         if (!firmware_has_feature(FW_FEATURE_VIO))
2375                 return -ENODEV;
2376
2377         ibmvscsi_transport_template =
2378                 srp_attach_transport(&ibmvscsi_transport_functions);
2379         if (!ibmvscsi_transport_template)
2380                 return -ENOMEM;
2381
2382         ret = vio_register_driver(&ibmvscsi_driver);
2383         if (ret)
2384                 srp_release_transport(ibmvscsi_transport_template);
2385         return ret;
2386 }
2387
2388 void __exit ibmvscsi_module_exit(void)
2389 {
2390         vio_unregister_driver(&ibmvscsi_driver);
2391         srp_release_transport(ibmvscsi_transport_template);
2392 }
2393
2394 module_init(ibmvscsi_module_init);
2395 module_exit(ibmvscsi_module_exit);