]> err.no Git - linux-2.6/blob - drivers/scsi/ibmvscsi/ibmvscsi.c
Merge git://git.infradead.org/battery-2.6
[linux-2.6] / drivers / scsi / ibmvscsi / ibmvscsi.c
1 /* ------------------------------------------------------------
2  * ibmvscsi.c
3  * (C) Copyright IBM Corporation 1994, 2004
4  * Authors: Colin DeVilbiss (devilbis@us.ibm.com)
5  *          Santiago Leon (santil@us.ibm.com)
6  *          Dave Boutcher (sleddog@us.ibm.com)
7  *
8  * This program is free software; you can redistribute it and/or modify
9  * it under the terms of the GNU General Public License as published by
10  * the Free Software Foundation; either version 2 of the License, or
11  * (at your option) any later version.
12  *
13  * This program is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16  * GNU General Public License for more details.
17  *
18  * You should have received a copy of the GNU General Public License
19  * along with this program; if not, write to the Free Software
20  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307
21  * USA
22  *
23  * ------------------------------------------------------------
24  * Emulation of a SCSI host adapter for Virtual I/O devices
25  *
26  * This driver supports the SCSI adapter implemented by the IBM
27  * Power5 firmware.  That SCSI adapter is not a physical adapter,
28  * but allows Linux SCSI peripheral drivers to directly
29  * access devices in another logical partition on the physical system.
30  *
31  * The virtual adapter(s) are present in the open firmware device
32  * tree just like real adapters.
33  *
34  * One of the capabilities provided on these systems is the ability
35  * to DMA between partitions.  The architecture states that for VSCSI,
36  * the server side is allowed to DMA to and from the client.  The client
37  * is never trusted to DMA to or from the server directly.
38  *
39  * Messages are sent between partitions on a "Command/Response Queue" 
40  * (CRQ), which is just a buffer of 16 byte entries in the receiver's
41  * memory.  Senders cannot access the buffer directly, but send messages by
42  * making a hypervisor call and passing in the 16 bytes.  The hypervisor
43  * puts the message in the next 16 byte space in round-robin fashion,
44  * turns on the high order bit of the message (the valid bit), and 
45  * generates an interrupt to the receiver (if interrupts are turned on.) 
46  * The receiver just turns off the valid bit when they have copied out
47  * the message.
48  *
49  * The VSCSI client builds a SCSI Remote Protocol (SRP) Information Unit
50  * (IU) (as defined in the T10 standard available at www.t10.org), gets 
51  * a DMA address for the message, and sends it to the server as the
52  * payload of a CRQ message.  The server DMAs the SRP IU and processes it,
53  * including doing any additional data transfers.  When it is done, it
54  * DMAs the SRP response back to the same address as the request came from,
55  * and sends a CRQ message back to inform the client that the request has
56  * completed.
57  *
58  * Note that some of the underlying infrastructure is different between
59  * machines conforming to the "RS/6000 Platform Architecture" (RPA) and
60  * the older iSeries hypervisor models.  To support both, some low level
61  * routines have been broken out into rpa_vscsi.c and iseries_vscsi.c.
62  * The Makefile should pick one, not two, not zero, of these.
63  *
64  * TODO: This is currently pretty tied to the IBM i/pSeries hypervisor
65  * interfaces.  It would be really nice to abstract this above an RDMA
66  * layer.
67  */
68
69 #include <linux/module.h>
70 #include <linux/moduleparam.h>
71 #include <linux/dma-mapping.h>
72 #include <linux/delay.h>
73 #include <asm/firmware.h>
74 #include <asm/vio.h>
75 #include <scsi/scsi.h>
76 #include <scsi/scsi_cmnd.h>
77 #include <scsi/scsi_host.h>
78 #include <scsi/scsi_device.h>
79 #include <scsi/scsi_transport_srp.h>
80 #include "ibmvscsi.h"
81
82 /* Module-wide tunables.  The defaults below are somewhat arbitrary, but
83  * OS/400 will use 3 busses (disks, CDs, tapes, I think.)
84  * Note that there are 3 bits of channel value, 6 bits of id, and
85  * 5 bits of LUN (see how lun_from_dev() packs them).
86  */
87 static int max_id = 64;	/* largest ID value for each channel */
88 static int max_channel = 3;	/* largest channel value */
89 static int init_timeout = 5;	/* initialization timeout, in seconds */
90 static int max_requests = IBMVSCSI_MAX_REQUESTS_DEFAULT;	/* maximum requests for this adapter */
91
92 static struct scsi_transport_template *ibmvscsi_transport_template;	/* NOTE(review): presumably the SRP transport template; it is not assigned in this part of the file */
93
94 #define IBMVSCSI_VERSION "1.5.8"	/* reported through MODULE_VERSION() below */
95
96 static struct ibmvscsi_ops *ibmvscsi_ops;	/* low-level CRQ operations (reset_crq_queue, send_crq, ...) used by the routines in this file */
97
98 MODULE_DESCRIPTION("IBM Virtual SCSI");
99 MODULE_AUTHOR("Dave Boutcher");
100 MODULE_LICENSE("GPL");
101 MODULE_VERSION(IBMVSCSI_VERSION);
102
103 module_param_named(max_id, max_id, int, S_IRUGO | S_IWUSR);	/* each tunable is registered with S_IRUGO | S_IWUSR permissions */
104 MODULE_PARM_DESC(max_id, "Largest ID value for each channel");
105 module_param_named(max_channel, max_channel, int, S_IRUGO | S_IWUSR);
106 MODULE_PARM_DESC(max_channel, "Largest channel value");
107 module_param_named(init_timeout, init_timeout, int, S_IRUGO | S_IWUSR);
108 MODULE_PARM_DESC(init_timeout, "Initialization timeout in seconds");
109 module_param_named(max_requests, max_requests, int, S_IRUGO | S_IWUSR);
110 MODULE_PARM_DESC(max_requests, "Maximum requests for this adapter");
111
112 /* ------------------------------------------------------------
113  * Routines for the event pool and event structs
114  */
115 /**
116  * initialize_event_pool: - Allocates and initializes the event pool for a host
117  * @pool:       event_pool to be initialized
118  * @size:       Number of events in pool
119  * @hostdata:   ibmvscsi_host_data who owns the event pool
120  *
121  * Returns zero on success.
122 */
123 static int initialize_event_pool(struct event_pool *pool,
124                                  int size, struct ibmvscsi_host_data *hostdata)
125 {
126         int i;
127
128         pool->size = size;
129         pool->next = 0;
130         pool->events = kcalloc(pool->size, sizeof(*pool->events), GFP_KERNEL);
131         if (!pool->events)
132                 return -ENOMEM;
133
134         pool->iu_storage =
135             dma_alloc_coherent(hostdata->dev,
136                                pool->size * sizeof(*pool->iu_storage),
137                                &pool->iu_token, 0);
138         if (!pool->iu_storage) {
139                 kfree(pool->events);
140                 return -ENOMEM;
141         }
142
143         for (i = 0; i < pool->size; ++i) {
144                 struct srp_event_struct *evt = &pool->events[i];
145                 memset(&evt->crq, 0x00, sizeof(evt->crq));
146                 atomic_set(&evt->free, 1);
147                 evt->crq.valid = 0x80;
148                 evt->crq.IU_length = sizeof(*evt->xfer_iu);
149                 evt->crq.IU_data_ptr = pool->iu_token + 
150                         sizeof(*evt->xfer_iu) * i;
151                 evt->xfer_iu = pool->iu_storage + i;
152                 evt->hostdata = hostdata;
153                 evt->ext_list = NULL;
154                 evt->ext_list_token = 0;
155         }
156
157         return 0;
158 }
159
160 /**
161  * release_event_pool: - Frees memory of an event pool of a host
162  * @pool:       event_pool to be released
163  * @hostdata:   ibmvscsi_host_data who owns the even pool
164  *
165  * Returns zero on success.
166 */
167 static void release_event_pool(struct event_pool *pool,
168                                struct ibmvscsi_host_data *hostdata)
169 {
170         int i, in_use = 0;
171         for (i = 0; i < pool->size; ++i) {
172                 if (atomic_read(&pool->events[i].free) != 1)
173                         ++in_use;
174                 if (pool->events[i].ext_list) {
175                         dma_free_coherent(hostdata->dev,
176                                   SG_ALL * sizeof(struct srp_direct_buf),
177                                   pool->events[i].ext_list,
178                                   pool->events[i].ext_list_token);
179                 }
180         }
181         if (in_use)
182                 dev_warn(hostdata->dev, "releasing event pool with %d "
183                          "events still in use?\n", in_use);
184         kfree(pool->events);
185         dma_free_coherent(hostdata->dev,
186                           pool->size * sizeof(*pool->iu_storage),
187                           pool->iu_storage, pool->iu_token);
188 }
189
190 /**
191  * valid_event_struct: - Determines if event is valid.
192  * @pool:       event_pool that contains the event
193  * @evt:        srp_event_struct to be checked for validity
194  *
195  * Returns zero if event is invalid, one otherwise.
196 */
197 static int valid_event_struct(struct event_pool *pool,
198                                 struct srp_event_struct *evt)
199 {
200         int index = evt - pool->events;
201         if (index < 0 || index >= pool->size)   /* outside of bounds */
202                 return 0;
203         if (evt != pool->events + index)        /* unaligned */
204                 return 0;
205         return 1;
206 }
207
208 /**
209  * ibmvscsi_free-event_struct: - Changes status of event to "free"
210  * @pool:       event_pool that contains the event
211  * @evt:        srp_event_struct to be modified
212  *
213 */
214 static void free_event_struct(struct event_pool *pool,
215                                        struct srp_event_struct *evt)
216 {
217         if (!valid_event_struct(pool, evt)) {
218                 dev_err(evt->hostdata->dev, "Freeing invalid event_struct %p "
219                         "(not in pool %p)\n", evt, pool->events);
220                 return;
221         }
222         if (atomic_inc_return(&evt->free) != 1) {
223                 dev_err(evt->hostdata->dev, "Freeing event_struct %p "
224                         "which is not in use!\n", evt);
225                 return;
226         }
227 }
228
229 /**
230  * get_evt_struct: - Gets the next free event in pool
231  * @pool:       event_pool that contains the events to be searched
232  *
233  * Returns the next event in "free" state, and NULL if none are free.
234  * Note that no synchronization is done here, we assume the host_lock
235  * will syncrhonze things.
236 */
237 static struct srp_event_struct *get_event_struct(struct event_pool *pool)
238 {
239         int i;
240         int poolsize = pool->size;
241         int offset = pool->next;
242
243         for (i = 0; i < poolsize; i++) {
244                 offset = (offset + 1) % poolsize;
245                 if (!atomic_dec_if_positive(&pool->events[offset].free)) {
246                         pool->next = offset;
247                         return &pool->events[offset];
248                 }
249         }
250
251         printk(KERN_ERR "ibmvscsi: found no event struct in pool!\n");
252         return NULL;
253 }
254
255 /**
256  * init_event_struct: Initialize fields in an event struct that are always 
257  *                    required.
258  * @evt:        The event
259  * @done:       Routine to call when the event is responded to
260  * @format:     SRP or MAD format
261  * @timeout:    timeout value set in the CRQ
262  */
263 static void init_event_struct(struct srp_event_struct *evt_struct,
264                               void (*done) (struct srp_event_struct *),
265                               u8 format,
266                               int timeout)
267 {
268         evt_struct->cmnd = NULL;
269         evt_struct->cmnd_done = NULL;
270         evt_struct->sync_srp = NULL;
271         evt_struct->crq.format = format;
272         evt_struct->crq.timeout = timeout;
273         evt_struct->done = done;
274 }
275
276 /* ------------------------------------------------------------
277  * Routines for receiving SCSI responses from the hosting partition
278  */
279
280 /**
281  * set_srp_direction: Set the fields in the srp related to data
282  *     direction and number of buffers based on the direction in
283  *     the scsi_cmnd and the number of buffers
284  */
285 static void set_srp_direction(struct scsi_cmnd *cmd,
286                               struct srp_cmd *srp_cmd, 
287                               int numbuf)
288 {
289         u8 fmt;
290
291         if (numbuf == 0)
292                 return;
293         
294         if (numbuf == 1)
295                 fmt = SRP_DATA_DESC_DIRECT;
296         else {
297                 fmt = SRP_DATA_DESC_INDIRECT;
298                 numbuf = min(numbuf, MAX_INDIRECT_BUFS);
299
300                 if (cmd->sc_data_direction == DMA_TO_DEVICE)
301                         srp_cmd->data_out_desc_cnt = numbuf;
302                 else
303                         srp_cmd->data_in_desc_cnt = numbuf;
304         }
305
306         if (cmd->sc_data_direction == DMA_TO_DEVICE)
307                 srp_cmd->buf_fmt = fmt << 4;
308         else
309                 srp_cmd->buf_fmt = fmt;
310 }
311
312 static void unmap_sg_list(int num_entries,
313                 struct device *dev,
314                 struct srp_direct_buf *md)
315 {
316         int i;
317
318         for (i = 0; i < num_entries; ++i)
319                 dma_unmap_single(dev, md[i].va, md[i].len, DMA_BIDIRECTIONAL);
320 }
321
322 /**
323  * unmap_cmd_data: - Unmap data pointed in srp_cmd based on the format
324  * @cmd:        srp_cmd whose additional_data member will be unmapped
325  * @dev:        device for which the memory is mapped
326  *
327 */
328 static void unmap_cmd_data(struct srp_cmd *cmd,
329                            struct srp_event_struct *evt_struct,
330                            struct device *dev)
331 {
332         u8 out_fmt, in_fmt;
333
334         out_fmt = cmd->buf_fmt >> 4;
335         in_fmt = cmd->buf_fmt & ((1U << 4) - 1);
336
337         if (out_fmt == SRP_NO_DATA_DESC && in_fmt == SRP_NO_DATA_DESC)
338                 return;
339         else if (out_fmt == SRP_DATA_DESC_DIRECT ||
340                  in_fmt == SRP_DATA_DESC_DIRECT) {
341                 struct srp_direct_buf *data =
342                         (struct srp_direct_buf *) cmd->add_data;
343                 dma_unmap_single(dev, data->va, data->len, DMA_BIDIRECTIONAL);
344         } else {
345                 struct srp_indirect_buf *indirect =
346                         (struct srp_indirect_buf *) cmd->add_data;
347                 int num_mapped = indirect->table_desc.len /
348                         sizeof(struct srp_direct_buf);
349
350                 if (num_mapped <= MAX_INDIRECT_BUFS) {
351                         unmap_sg_list(num_mapped, dev, &indirect->desc_list[0]);
352                         return;
353                 }
354
355                 unmap_sg_list(num_mapped, dev, evt_struct->ext_list);
356         }
357 }
358
359 static int map_sg_list(struct scsi_cmnd *cmd, int nseg,
360                        struct srp_direct_buf *md)
361 {
362         int i;
363         struct scatterlist *sg;
364         u64 total_length = 0;
365
366         scsi_for_each_sg(cmd, sg, nseg, i) {
367                 struct srp_direct_buf *descr = md + i;
368                 descr->va = sg_dma_address(sg);
369                 descr->len = sg_dma_len(sg);
370                 descr->key = 0;
371                 total_length += sg_dma_len(sg);
372         }
373         return total_length;
374 }
375
376 /**
377  * map_sg_data: - Maps dma for a scatterlist and initializes decriptor fields
378  * @cmd:        Scsi_Cmnd with the scatterlist
379  * @srp_cmd:    srp_cmd that contains the memory descriptor
380  * @dev:        device for which to map dma memory
381  *
382  * Called by map_data_for_srp_cmd() when building srp cmd from scsi cmd.
383  * Returns 1 on success.
384 */
385 static int map_sg_data(struct scsi_cmnd *cmd,
386                        struct srp_event_struct *evt_struct,
387                        struct srp_cmd *srp_cmd, struct device *dev)
388 {
389
390         int sg_mapped;
391         u64 total_length = 0;
392         struct srp_direct_buf *data =
393                 (struct srp_direct_buf *) srp_cmd->add_data;
394         struct srp_indirect_buf *indirect =
395                 (struct srp_indirect_buf *) data;
396
397         sg_mapped = scsi_dma_map(cmd);
398         if (!sg_mapped)
399                 return 1;
400         else if (sg_mapped < 0)
401                 return 0;
402
403         set_srp_direction(cmd, srp_cmd, sg_mapped);
404
405         /* special case; we can use a single direct descriptor */
406         if (sg_mapped == 1) {
407                 map_sg_list(cmd, sg_mapped, data);
408                 return 1;
409         }
410
411         indirect->table_desc.va = 0;
412         indirect->table_desc.len = sg_mapped * sizeof(struct srp_direct_buf);
413         indirect->table_desc.key = 0;
414
415         if (sg_mapped <= MAX_INDIRECT_BUFS) {
416                 total_length = map_sg_list(cmd, sg_mapped,
417                                            &indirect->desc_list[0]);
418                 indirect->len = total_length;
419                 return 1;
420         }
421
422         /* get indirect table */
423         if (!evt_struct->ext_list) {
424                 evt_struct->ext_list = (struct srp_direct_buf *)
425                         dma_alloc_coherent(dev,
426                                            SG_ALL * sizeof(struct srp_direct_buf),
427                                            &evt_struct->ext_list_token, 0);
428                 if (!evt_struct->ext_list) {
429                         sdev_printk(KERN_ERR, cmd->device,
430                                     "Can't allocate memory for indirect table\n");
431                         return 0;
432                 }
433         }
434
435         total_length = map_sg_list(cmd, sg_mapped, evt_struct->ext_list);
436
437         indirect->len = total_length;
438         indirect->table_desc.va = evt_struct->ext_list_token;
439         indirect->table_desc.len = sg_mapped * sizeof(indirect->desc_list[0]);
440         memcpy(indirect->desc_list, evt_struct->ext_list,
441                MAX_INDIRECT_BUFS * sizeof(struct srp_direct_buf));
442         return 1;
443 }
444
445 /**
446  * map_data_for_srp_cmd: - Calls functions to map data for srp cmds
447  * @cmd:        struct scsi_cmnd with the memory to be mapped
448  * @srp_cmd:    srp_cmd that contains the memory descriptor
449  * @dev:        dma device for which to map dma memory
450  *
451  * Called by scsi_cmd_to_srp_cmd() when converting scsi cmds to srp cmds 
452  * Returns 1 on success.
453 */
454 static int map_data_for_srp_cmd(struct scsi_cmnd *cmd,
455                                 struct srp_event_struct *evt_struct,
456                                 struct srp_cmd *srp_cmd, struct device *dev)
457 {
458         switch (cmd->sc_data_direction) {
459         case DMA_FROM_DEVICE:
460         case DMA_TO_DEVICE:
461                 break;
462         case DMA_NONE:
463                 return 1;
464         case DMA_BIDIRECTIONAL:
465                 sdev_printk(KERN_ERR, cmd->device,
466                             "Can't map DMA_BIDIRECTIONAL to read/write\n");
467                 return 0;
468         default:
469                 sdev_printk(KERN_ERR, cmd->device,
470                             "Unknown data direction 0x%02x; can't map!\n",
471                             cmd->sc_data_direction);
472                 return 0;
473         }
474
475         return map_sg_data(cmd, evt_struct, srp_cmd, dev);
476 }
477
478 /**
479  * purge_requests: Our virtual adapter just shut down.  purge any sent requests
480  * @hostdata:    the adapter
481  */
482 static void purge_requests(struct ibmvscsi_host_data *hostdata, int error_code)
483 {
484         struct srp_event_struct *tmp_evt, *pos;
485         unsigned long flags;
486
487         spin_lock_irqsave(hostdata->host->host_lock, flags);
488         list_for_each_entry_safe(tmp_evt, pos, &hostdata->sent, list) {
489                 list_del(&tmp_evt->list);
490                 del_timer(&tmp_evt->timer);
491                 if (tmp_evt->cmnd) {
492                         tmp_evt->cmnd->result = (error_code << 16);
493                         unmap_cmd_data(&tmp_evt->iu.srp.cmd,
494                                        tmp_evt,
495                                        tmp_evt->hostdata->dev);
496                         if (tmp_evt->cmnd_done)
497                                 tmp_evt->cmnd_done(tmp_evt->cmnd);
498                 } else if (tmp_evt->done)
499                         tmp_evt->done(tmp_evt);
500                 free_event_struct(&tmp_evt->hostdata->pool, tmp_evt);
501         }
502         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
503 }
504
505 /**
506  * ibmvscsi_reset_host - Reset the connection to the server
507  * @hostdata:   struct ibmvscsi_host_data to reset
508 */
509 static void ibmvscsi_reset_host(struct ibmvscsi_host_data *hostdata)
510 {
511         scsi_block_requests(hostdata->host);
512         atomic_set(&hostdata->request_limit, 0);
513
514         purge_requests(hostdata, DID_ERROR);
515         if ((ibmvscsi_ops->reset_crq_queue(&hostdata->queue, hostdata)) ||
516             (ibmvscsi_ops->send_crq(hostdata, 0xC001000000000000LL, 0)) ||
517             (vio_enable_interrupts(to_vio_dev(hostdata->dev)))) {
518                 atomic_set(&hostdata->request_limit, -1);
519                 dev_err(hostdata->dev, "error after reset\n");
520         }
521
522         scsi_unblock_requests(hostdata->host);
523 }
524
525 /**
526  * ibmvscsi_timeout - Internal command timeout handler
527  * @evt_struct: struct srp_event_struct that timed out
528  *
529  * Called when an internally generated command times out
530 */
531 static void ibmvscsi_timeout(struct srp_event_struct *evt_struct)
532 {
533         struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
534
535         dev_err(hostdata->dev, "Command timed out (%x). Resetting connection\n",
536                 evt_struct->iu.srp.cmd.opcode);
537
538         ibmvscsi_reset_host(hostdata);
539 }
540
541
542 /* ------------------------------------------------------------
543  * Routines for sending and receiving SRPs
544  */
545 /**
546  * ibmvscsi_send_srp_event: - Transforms event to u64 array and calls send_crq()
547  * @evt_struct: evt_struct to be sent
548  * @hostdata:   ibmvscsi_host_data of host
549  * @timeout:    timeout in seconds - 0 means do not time command
550  *
551  * Returns the value returned from ibmvscsi_send_crq(). (Zero for success)
552  * Note that this routine assumes that host_lock is held for synchronization
553 */
554 static int ibmvscsi_send_srp_event(struct srp_event_struct *evt_struct,
555                                    struct ibmvscsi_host_data *hostdata,
556                                    unsigned long timeout)
557 {
558         u64 *crq_as_u64 = (u64 *) &evt_struct->crq;
559         int request_status = 0;
560         int rc;
561
562         /* If we have exhausted our request limit, just fail this request,
563          * unless it is for a reset or abort.
564          * Note that there are rare cases involving driver generated requests 
565          * (such as task management requests) that the mid layer may think we
566          * can handle more requests (can_queue) when we actually can't
567          */
568         if (evt_struct->crq.format == VIOSRP_SRP_FORMAT) {
569                 request_status =
570                         atomic_dec_if_positive(&hostdata->request_limit);
571                 /* If request limit was -1 when we started, it is now even
572                  * less than that
573                  */
574                 if (request_status < -1)
575                         goto send_error;
576                 /* Otherwise, we may have run out of requests. */
577                 /* If request limit was 0 when we started the adapter is in the
578                  * process of performing a login with the server adapter, or
579                  * we may have run out of requests.
580                  */
581                 else if (request_status == -1 &&
582                          evt_struct->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
583                         goto send_busy;
584                 /* Abort and reset calls should make it through.
585                  * Nothing except abort and reset should use the last two
586                  * slots unless we had two or less to begin with.
587                  */
588                 else if (request_status < 2 &&
589                          evt_struct->iu.srp.cmd.opcode != SRP_TSK_MGMT) {
590                         /* In the case that we have less than two requests
591                          * available, check the server limit as a combination
592                          * of the request limit and the number of requests
593                          * in-flight (the size of the send list).  If the
594                          * server limit is greater than 2, return busy so
595                          * that the last two are reserved for reset and abort.
596                          */
597                         int server_limit = request_status;
598                         struct srp_event_struct *tmp_evt;
599
600                         list_for_each_entry(tmp_evt, &hostdata->sent, list) {
601                                 server_limit++;
602                         }
603
604                         if (server_limit > 2)
605                                 goto send_busy;
606                 }
607         }
608
609         /* Copy the IU into the transfer area */
610         *evt_struct->xfer_iu = evt_struct->iu;
611         evt_struct->xfer_iu->srp.rsp.tag = (u64)evt_struct;
612
613         /* Add this to the sent list.  We need to do this 
614          * before we actually send 
615          * in case it comes back REALLY fast
616          */
617         list_add_tail(&evt_struct->list, &hostdata->sent);
618
619         init_timer(&evt_struct->timer);
620         if (timeout) {
621                 evt_struct->timer.data = (unsigned long) evt_struct;
622                 evt_struct->timer.expires = jiffies + (timeout * HZ);
623                 evt_struct->timer.function = (void (*)(unsigned long))ibmvscsi_timeout;
624                 add_timer(&evt_struct->timer);
625         }
626
627         if ((rc =
628              ibmvscsi_ops->send_crq(hostdata, crq_as_u64[0], crq_as_u64[1])) != 0) {
629                 list_del(&evt_struct->list);
630                 del_timer(&evt_struct->timer);
631
632                 /* If send_crq returns H_CLOSED, return SCSI_MLQUEUE_HOST_BUSY.
633                  * Firmware will send a CRQ with a transport event (0xFF) to
634                  * tell this client what has happened to the transport.  This
635                  * will be handled in ibmvscsi_handle_crq()
636                  */
637                 if (rc == H_CLOSED) {
638                         dev_warn(hostdata->dev, "send warning. "
639                                  "Receive queue closed, will retry.\n");
640                         goto send_busy;
641                 }
642                 dev_err(hostdata->dev, "send error %d\n", rc);
643                 atomic_inc(&hostdata->request_limit);
644                 goto send_error;
645         }
646
647         return 0;
648
649  send_busy:
650         unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
651
652         free_event_struct(&hostdata->pool, evt_struct);
653         if (request_status != -1)
654                 atomic_inc(&hostdata->request_limit);
655         return SCSI_MLQUEUE_HOST_BUSY;
656
657  send_error:
658         unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
659
660         if (evt_struct->cmnd != NULL) {
661                 evt_struct->cmnd->result = DID_ERROR << 16;
662                 evt_struct->cmnd_done(evt_struct->cmnd);
663         } else if (evt_struct->done)
664                 evt_struct->done(evt_struct);
665
666         free_event_struct(&hostdata->pool, evt_struct);
667         return 0;
668 }
669
670 /**
671  * handle_cmd_rsp: -  Handle responses from commands
672  * @evt_struct: srp_event_struct to be handled
673  *
674  * Used as a callback by when sending scsi cmds.
675  * Gets called by ibmvscsi_handle_crq()
676 */
677 static void handle_cmd_rsp(struct srp_event_struct *evt_struct)
678 {
679         struct srp_rsp *rsp = &evt_struct->xfer_iu->srp.rsp;
680         struct scsi_cmnd *cmnd = evt_struct->cmnd;
681
682         if (unlikely(rsp->opcode != SRP_RSP)) {
683                 if (printk_ratelimit())
684                         dev_warn(evt_struct->hostdata->dev,
685                                  "bad SRP RSP type %d\n", rsp->opcode);
686         }
687         
688         if (cmnd) {
689                 cmnd->result |= rsp->status;
690                 if (((cmnd->result >> 1) & 0x1f) == CHECK_CONDITION)
691                         memcpy(cmnd->sense_buffer,
692                                rsp->data,
693                                rsp->sense_data_len);
694                 unmap_cmd_data(&evt_struct->iu.srp.cmd, 
695                                evt_struct, 
696                                evt_struct->hostdata->dev);
697
698                 if (rsp->flags & SRP_RSP_FLAG_DOOVER)
699                         scsi_set_resid(cmnd, rsp->data_out_res_cnt);
700                 else if (rsp->flags & SRP_RSP_FLAG_DIOVER)
701                         scsi_set_resid(cmnd, rsp->data_in_res_cnt);
702         }
703
704         if (evt_struct->cmnd_done)
705                 evt_struct->cmnd_done(cmnd);
706 }
707
708 /**
709  * lun_from_dev: - Returns the lun of the scsi device
710  * @dev:        struct scsi_device
711  *
712 */
713 static inline u16 lun_from_dev(struct scsi_device *dev)
714 {
715         return (0x2 << 14) | (dev->id << 8) | (dev->channel << 5) | dev->lun;
716 }
717
718 /**
719  * ibmvscsi_queue: - The queuecommand function of the scsi template 
720  * @cmd:        struct scsi_cmnd to be executed
721  * @done:       Callback function to be called when cmd is completed
722 */
723 static int ibmvscsi_queuecommand(struct scsi_cmnd *cmnd,
724                                  void (*done) (struct scsi_cmnd *))
725 {
726         struct srp_cmd *srp_cmd;
727         struct srp_event_struct *evt_struct;
728         struct srp_indirect_buf *indirect;
729         struct ibmvscsi_host_data *hostdata = shost_priv(cmnd->device->host);
730         u16 lun = lun_from_dev(cmnd->device);
731         u8 out_fmt, in_fmt;
732
733         cmnd->result = (DID_OK << 16);
734         evt_struct = get_event_struct(&hostdata->pool);
735         if (!evt_struct)
736                 return SCSI_MLQUEUE_HOST_BUSY;
737
738         /* Set up the actual SRP IU */
739         srp_cmd = &evt_struct->iu.srp.cmd;
740         memset(srp_cmd, 0x00, SRP_MAX_IU_LEN);
741         srp_cmd->opcode = SRP_CMD;
742         memcpy(srp_cmd->cdb, cmnd->cmnd, sizeof(srp_cmd->cdb));
743         srp_cmd->lun = ((u64) lun) << 48;
744
745         if (!map_data_for_srp_cmd(cmnd, evt_struct, srp_cmd, hostdata->dev)) {
746                 sdev_printk(KERN_ERR, cmnd->device, "couldn't convert cmd to srp_cmd\n");
747                 free_event_struct(&hostdata->pool, evt_struct);
748                 return SCSI_MLQUEUE_HOST_BUSY;
749         }
750
751         init_event_struct(evt_struct,
752                           handle_cmd_rsp,
753                           VIOSRP_SRP_FORMAT,
754                           cmnd->timeout_per_command/HZ);
755
756         evt_struct->cmnd = cmnd;
757         evt_struct->cmnd_done = done;
758
759         /* Fix up dma address of the buffer itself */
760         indirect = (struct srp_indirect_buf *) srp_cmd->add_data;
761         out_fmt = srp_cmd->buf_fmt >> 4;
762         in_fmt = srp_cmd->buf_fmt & ((1U << 4) - 1);
763         if ((in_fmt == SRP_DATA_DESC_INDIRECT ||
764              out_fmt == SRP_DATA_DESC_INDIRECT) &&
765             indirect->table_desc.va == 0) {
766                 indirect->table_desc.va = evt_struct->crq.IU_data_ptr +
767                         offsetof(struct srp_cmd, add_data) +
768                         offsetof(struct srp_indirect_buf, desc_list);
769         }
770
771         return ibmvscsi_send_srp_event(evt_struct, hostdata, 0);
772 }
773
774 /* ------------------------------------------------------------
775  * Routines for driver initialization
776  */
777 /**
778  * adapter_info_rsp: - Handle response to MAD adapter info request
779  * @evt_struct: srp_event_struct with the response
780  *
781  * Used as a "done" callback by when sending adapter_info. Gets called
782  * by ibmvscsi_handle_crq()
783 */
784 static void adapter_info_rsp(struct srp_event_struct *evt_struct)
785 {
786         struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
787         dma_unmap_single(hostdata->dev,
788                          evt_struct->iu.mad.adapter_info.buffer,
789                          evt_struct->iu.mad.adapter_info.common.length,
790                          DMA_BIDIRECTIONAL);
791
792         if (evt_struct->xfer_iu->mad.adapter_info.common.status) {
793                 dev_err(hostdata->dev, "error %d getting adapter info\n",
794                         evt_struct->xfer_iu->mad.adapter_info.common.status);
795         } else {
796                 dev_info(hostdata->dev, "host srp version: %s, "
797                          "host partition %s (%d), OS %d, max io %u\n",
798                          hostdata->madapter_info.srp_version,
799                          hostdata->madapter_info.partition_name,
800                          hostdata->madapter_info.partition_number,
801                          hostdata->madapter_info.os_type,
802                          hostdata->madapter_info.port_max_txu[0]);
803                 
804                 if (hostdata->madapter_info.port_max_txu[0]) 
805                         hostdata->host->max_sectors = 
806                                 hostdata->madapter_info.port_max_txu[0] >> 9;
807                 
808                 if (hostdata->madapter_info.os_type == 3 &&
809                     strcmp(hostdata->madapter_info.srp_version, "1.6a") <= 0) {
810                         dev_err(hostdata->dev, "host (Ver. %s) doesn't support large transfers\n",
811                                 hostdata->madapter_info.srp_version);
812                         dev_err(hostdata->dev, "limiting scatterlists to %d\n",
813                                 MAX_INDIRECT_BUFS);
814                         hostdata->host->sg_tablesize = MAX_INDIRECT_BUFS;
815                 }
816         }
817 }
818
819 /**
820  * send_mad_adapter_info: - Sends the mad adapter info request
821  *      and stores the result so it can be retrieved with
822  *      sysfs.  We COULD consider causing a failure if the
823  *      returned SRP version doesn't match ours.
824  * @hostdata:   ibmvscsi_host_data of host
825  * 
826  * Returns zero if successful.
827 */
828 static void send_mad_adapter_info(struct ibmvscsi_host_data *hostdata)
829 {
830         struct viosrp_adapter_info *req;
831         struct srp_event_struct *evt_struct;
832         unsigned long flags;
833         dma_addr_t addr;
834
835         evt_struct = get_event_struct(&hostdata->pool);
836         if (!evt_struct) {
837                 dev_err(hostdata->dev,
838                         "couldn't allocate an event for ADAPTER_INFO_REQ!\n");
839                 return;
840         }
841
842         init_event_struct(evt_struct,
843                           adapter_info_rsp,
844                           VIOSRP_MAD_FORMAT,
845                           init_timeout);
846         
847         req = &evt_struct->iu.mad.adapter_info;
848         memset(req, 0x00, sizeof(*req));
849         
850         req->common.type = VIOSRP_ADAPTER_INFO_TYPE;
851         req->common.length = sizeof(hostdata->madapter_info);
852         req->buffer = addr = dma_map_single(hostdata->dev,
853                                             &hostdata->madapter_info,
854                                             sizeof(hostdata->madapter_info),
855                                             DMA_BIDIRECTIONAL);
856
857         if (dma_mapping_error(req->buffer)) {
858                 dev_err(hostdata->dev, "Unable to map request_buffer for adapter_info!\n");
859                 free_event_struct(&hostdata->pool, evt_struct);
860                 return;
861         }
862         
863         spin_lock_irqsave(hostdata->host->host_lock, flags);
864         if (ibmvscsi_send_srp_event(evt_struct, hostdata, init_timeout * 2)) {
865                 dev_err(hostdata->dev, "couldn't send ADAPTER_INFO_REQ!\n");
866                 dma_unmap_single(hostdata->dev,
867                                  addr,
868                                  sizeof(hostdata->madapter_info),
869                                  DMA_BIDIRECTIONAL);
870         }
871         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
872 };
873
874 /**
875  * login_rsp: - Handle response to SRP login request
876  * @evt_struct: srp_event_struct with the response
877  *
878  * Used as a "done" callback by when sending srp_login. Gets called
879  * by ibmvscsi_handle_crq()
880 */
881 static void login_rsp(struct srp_event_struct *evt_struct)
882 {
883         struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
884         switch (evt_struct->xfer_iu->srp.login_rsp.opcode) {
885         case SRP_LOGIN_RSP:     /* it worked! */
886                 break;
887         case SRP_LOGIN_REJ:     /* refused! */
888                 dev_info(hostdata->dev, "SRP_LOGIN_REJ reason %u\n",
889                          evt_struct->xfer_iu->srp.login_rej.reason);
890                 /* Login failed.  */
891                 atomic_set(&hostdata->request_limit, -1);
892                 return;
893         default:
894                 dev_err(hostdata->dev, "Invalid login response typecode 0x%02x!\n",
895                         evt_struct->xfer_iu->srp.login_rsp.opcode);
896                 /* Login failed.  */
897                 atomic_set(&hostdata->request_limit, -1);
898                 return;
899         }
900
901         dev_info(hostdata->dev, "SRP_LOGIN succeeded\n");
902
903         if (evt_struct->xfer_iu->srp.login_rsp.req_lim_delta < 0)
904                 dev_err(hostdata->dev, "Invalid request_limit.\n");
905
906         /* Now we know what the real request-limit is.
907          * This value is set rather than added to request_limit because
908          * request_limit could have been set to -1 by this client.
909          */
910         atomic_set(&hostdata->request_limit,
911                    evt_struct->xfer_iu->srp.login_rsp.req_lim_delta);
912
913         /* If we had any pending I/Os, kick them */
914         scsi_unblock_requests(hostdata->host);
915
916         send_mad_adapter_info(hostdata);
917         return;
918 }
919
920 /**
921  * send_srp_login: - Sends the srp login
922  * @hostdata:   ibmvscsi_host_data of host
923  * 
924  * Returns zero if successful.
925 */
926 static int send_srp_login(struct ibmvscsi_host_data *hostdata)
927 {
928         int rc;
929         unsigned long flags;
930         struct srp_login_req *login;
931         struct srp_event_struct *evt_struct = get_event_struct(&hostdata->pool);
932         if (!evt_struct) {
933                 dev_err(hostdata->dev, "couldn't allocate an event for login req!\n");
934                 return FAILED;
935         }
936
937         init_event_struct(evt_struct,
938                           login_rsp,
939                           VIOSRP_SRP_FORMAT,
940                           init_timeout);
941
942         login = &evt_struct->iu.srp.login_req;
943         memset(login, 0x00, sizeof(struct srp_login_req));
944         login->opcode = SRP_LOGIN_REQ;
945         login->req_it_iu_len = sizeof(union srp_iu);
946         login->req_buf_fmt = SRP_BUF_FORMAT_DIRECT | SRP_BUF_FORMAT_INDIRECT;
947         
948         spin_lock_irqsave(hostdata->host->host_lock, flags);
949         /* Start out with a request limit of 0, since this is negotiated in
950          * the login request we are just sending and login requests always
951          * get sent by the driver regardless of request_limit.
952          */
953         atomic_set(&hostdata->request_limit, 0);
954
955         rc = ibmvscsi_send_srp_event(evt_struct, hostdata, init_timeout * 2);
956         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
957         dev_info(hostdata->dev, "sent SRP login\n");
958         return rc;
959 };
960
961 /**
962  * sync_completion: Signal that a synchronous command has completed
963  * Note that after returning from this call, the evt_struct is freed.
964  * the caller waiting on this completion shouldn't touch the evt_struct
965  * again.
966  */
967 static void sync_completion(struct srp_event_struct *evt_struct)
968 {
969         /* copy the response back */
970         if (evt_struct->sync_srp)
971                 *evt_struct->sync_srp = *evt_struct->xfer_iu;
972         
973         complete(&evt_struct->comp);
974 }
975
976 /**
977  * ibmvscsi_abort: Abort a command...from scsi host template
978  * send this over to the server and wait synchronously for the response
979  */
980 static int ibmvscsi_eh_abort_handler(struct scsi_cmnd *cmd)
981 {
982         struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
983         struct srp_tsk_mgmt *tsk_mgmt;
984         struct srp_event_struct *evt;
985         struct srp_event_struct *tmp_evt, *found_evt;
986         union viosrp_iu srp_rsp;
987         int rsp_rc;
988         unsigned long flags;
989         u16 lun = lun_from_dev(cmd->device);
990         unsigned long wait_switch = 0;
991
992         /* First, find this command in our sent list so we can figure
993          * out the correct tag
994          */
995         spin_lock_irqsave(hostdata->host->host_lock, flags);
996         wait_switch = jiffies + (init_timeout * HZ);
997         do {
998                 found_evt = NULL;
999                 list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1000                         if (tmp_evt->cmnd == cmd) {
1001                                 found_evt = tmp_evt;
1002                                 break;
1003                         }
1004                 }
1005
1006                 if (!found_evt) {
1007                         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1008                         return SUCCESS;
1009                 }
1010
1011                 evt = get_event_struct(&hostdata->pool);
1012                 if (evt == NULL) {
1013                         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1014                         sdev_printk(KERN_ERR, cmd->device,
1015                                 "failed to allocate abort event\n");
1016                         return FAILED;
1017                 }
1018         
1019                 init_event_struct(evt,
1020                                   sync_completion,
1021                                   VIOSRP_SRP_FORMAT,
1022                                   init_timeout);
1023
1024                 tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1025         
1026                 /* Set up an abort SRP command */
1027                 memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1028                 tsk_mgmt->opcode = SRP_TSK_MGMT;
1029                 tsk_mgmt->lun = ((u64) lun) << 48;
1030                 tsk_mgmt->tsk_mgmt_func = SRP_TSK_ABORT_TASK;
1031                 tsk_mgmt->task_tag = (u64) found_evt;
1032
1033                 evt->sync_srp = &srp_rsp;
1034
1035                 init_completion(&evt->comp);
1036                 rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, init_timeout * 2);
1037
1038                 if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1039                         break;
1040
1041                 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1042                 msleep(10);
1043                 spin_lock_irqsave(hostdata->host->host_lock, flags);
1044         } while (time_before(jiffies, wait_switch));
1045
1046         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1047
1048         if (rsp_rc != 0) {
1049                 sdev_printk(KERN_ERR, cmd->device,
1050                             "failed to send abort() event. rc=%d\n", rsp_rc);
1051                 return FAILED;
1052         }
1053
1054         sdev_printk(KERN_INFO, cmd->device,
1055                     "aborting command. lun 0x%lx, tag 0x%lx\n",
1056                     (((u64) lun) << 48), (u64) found_evt);
1057
1058         wait_for_completion(&evt->comp);
1059
1060         /* make sure we got a good response */
1061         if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1062                 if (printk_ratelimit())
1063                         sdev_printk(KERN_WARNING, cmd->device, "abort bad SRP RSP type %d\n",
1064                                     srp_rsp.srp.rsp.opcode);
1065                 return FAILED;
1066         }
1067
1068         if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1069                 rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1070         else
1071                 rsp_rc = srp_rsp.srp.rsp.status;
1072
1073         if (rsp_rc) {
1074                 if (printk_ratelimit())
1075                         sdev_printk(KERN_WARNING, cmd->device,
1076                                     "abort code %d for task tag 0x%lx\n",
1077                                     rsp_rc, tsk_mgmt->task_tag);
1078                 return FAILED;
1079         }
1080
1081         /* Because we dropped the spinlock above, it's possible
1082          * The event is no longer in our list.  Make sure it didn't
1083          * complete while we were aborting
1084          */
1085         spin_lock_irqsave(hostdata->host->host_lock, flags);
1086         found_evt = NULL;
1087         list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1088                 if (tmp_evt->cmnd == cmd) {
1089                         found_evt = tmp_evt;
1090                         break;
1091                 }
1092         }
1093
1094         if (found_evt == NULL) {
1095                 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1096                 sdev_printk(KERN_INFO, cmd->device, "aborted task tag 0x%lx completed\n",
1097                             tsk_mgmt->task_tag);
1098                 return SUCCESS;
1099         }
1100
1101         sdev_printk(KERN_INFO, cmd->device, "successfully aborted task tag 0x%lx\n",
1102                     tsk_mgmt->task_tag);
1103
1104         cmd->result = (DID_ABORT << 16);
1105         list_del(&found_evt->list);
1106         unmap_cmd_data(&found_evt->iu.srp.cmd, found_evt,
1107                        found_evt->hostdata->dev);
1108         free_event_struct(&found_evt->hostdata->pool, found_evt);
1109         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1110         atomic_inc(&hostdata->request_limit);
1111         return SUCCESS;
1112 }
1113
1114 /**
1115  * ibmvscsi_eh_device_reset_handler: Reset a single LUN...from scsi host 
1116  * template send this over to the server and wait synchronously for the 
1117  * response
1118  */
1119 static int ibmvscsi_eh_device_reset_handler(struct scsi_cmnd *cmd)
1120 {
1121         struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1122         struct srp_tsk_mgmt *tsk_mgmt;
1123         struct srp_event_struct *evt;
1124         struct srp_event_struct *tmp_evt, *pos;
1125         union viosrp_iu srp_rsp;
1126         int rsp_rc;
1127         unsigned long flags;
1128         u16 lun = lun_from_dev(cmd->device);
1129         unsigned long wait_switch = 0;
1130
1131         spin_lock_irqsave(hostdata->host->host_lock, flags);
1132         wait_switch = jiffies + (init_timeout * HZ);
1133         do {
1134                 evt = get_event_struct(&hostdata->pool);
1135                 if (evt == NULL) {
1136                         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1137                         sdev_printk(KERN_ERR, cmd->device,
1138                                 "failed to allocate reset event\n");
1139                         return FAILED;
1140                 }
1141         
1142                 init_event_struct(evt,
1143                                   sync_completion,
1144                                   VIOSRP_SRP_FORMAT,
1145                                   init_timeout);
1146
1147                 tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1148
1149                 /* Set up a lun reset SRP command */
1150                 memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1151                 tsk_mgmt->opcode = SRP_TSK_MGMT;
1152                 tsk_mgmt->lun = ((u64) lun) << 48;
1153                 tsk_mgmt->tsk_mgmt_func = SRP_TSK_LUN_RESET;
1154
1155                 evt->sync_srp = &srp_rsp;
1156
1157                 init_completion(&evt->comp);
1158                 rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, init_timeout * 2);
1159
1160                 if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1161                         break;
1162
1163                 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1164                 msleep(10);
1165                 spin_lock_irqsave(hostdata->host->host_lock, flags);
1166         } while (time_before(jiffies, wait_switch));
1167
1168         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1169
1170         if (rsp_rc != 0) {
1171                 sdev_printk(KERN_ERR, cmd->device,
1172                             "failed to send reset event. rc=%d\n", rsp_rc);
1173                 return FAILED;
1174         }
1175
1176         sdev_printk(KERN_INFO, cmd->device, "resetting device. lun 0x%lx\n",
1177                     (((u64) lun) << 48));
1178
1179         wait_for_completion(&evt->comp);
1180
1181         /* make sure we got a good response */
1182         if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1183                 if (printk_ratelimit())
1184                         sdev_printk(KERN_WARNING, cmd->device, "reset bad SRP RSP type %d\n",
1185                                     srp_rsp.srp.rsp.opcode);
1186                 return FAILED;
1187         }
1188
1189         if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1190                 rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1191         else
1192                 rsp_rc = srp_rsp.srp.rsp.status;
1193
1194         if (rsp_rc) {
1195                 if (printk_ratelimit())
1196                         sdev_printk(KERN_WARNING, cmd->device,
1197                                     "reset code %d for task tag 0x%lx\n",
1198                                     rsp_rc, tsk_mgmt->task_tag);
1199                 return FAILED;
1200         }
1201
1202         /* We need to find all commands for this LUN that have not yet been
1203          * responded to, and fail them with DID_RESET
1204          */
1205         spin_lock_irqsave(hostdata->host->host_lock, flags);
1206         list_for_each_entry_safe(tmp_evt, pos, &hostdata->sent, list) {
1207                 if ((tmp_evt->cmnd) && (tmp_evt->cmnd->device == cmd->device)) {
1208                         if (tmp_evt->cmnd)
1209                                 tmp_evt->cmnd->result = (DID_RESET << 16);
1210                         list_del(&tmp_evt->list);
1211                         unmap_cmd_data(&tmp_evt->iu.srp.cmd, tmp_evt,
1212                                        tmp_evt->hostdata->dev);
1213                         free_event_struct(&tmp_evt->hostdata->pool,
1214                                                    tmp_evt);
1215                         atomic_inc(&hostdata->request_limit);
1216                         if (tmp_evt->cmnd_done)
1217                                 tmp_evt->cmnd_done(tmp_evt->cmnd);
1218                         else if (tmp_evt->done)
1219                                 tmp_evt->done(tmp_evt);
1220                 }
1221         }
1222         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1223         return SUCCESS;
1224 }
1225
1226 /**
1227  * ibmvscsi_eh_host_reset_handler - Reset the connection to the server
1228  * @cmd:        struct scsi_cmnd having problems
1229 */
1230 static int ibmvscsi_eh_host_reset_handler(struct scsi_cmnd *cmd)
1231 {
1232         unsigned long wait_switch = 0;
1233         struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1234
1235         dev_err(hostdata->dev, "Resetting connection due to error recovery\n");
1236
1237         ibmvscsi_reset_host(hostdata);
1238
1239         for (wait_switch = jiffies + (init_timeout * HZ);
1240              time_before(jiffies, wait_switch) &&
1241                      atomic_read(&hostdata->request_limit) < 2;) {
1242
1243                 msleep(10);
1244         }
1245
1246         if (atomic_read(&hostdata->request_limit) <= 0)
1247                 return FAILED;
1248
1249         return SUCCESS;
1250 }
1251
1252 /**
1253  * ibmvscsi_handle_crq: - Handles and frees received events in the CRQ
1254  * @crq:        Command/Response queue
1255  * @hostdata:   ibmvscsi_host_data of host
1256  *
1257 */
1258 void ibmvscsi_handle_crq(struct viosrp_crq *crq,
1259                          struct ibmvscsi_host_data *hostdata)
1260 {
1261         long rc;
1262         unsigned long flags;
1263         struct srp_event_struct *evt_struct =
1264             (struct srp_event_struct *)crq->IU_data_ptr;
1265         switch (crq->valid) {
1266         case 0xC0:              /* initialization */
1267                 switch (crq->format) {
1268                 case 0x01:      /* Initialization message */
1269                         dev_info(hostdata->dev, "partner initialized\n");
1270                         /* Send back a response */
1271                         if ((rc = ibmvscsi_ops->send_crq(hostdata,
1272                                                          0xC002000000000000LL, 0)) == 0) {
1273                                 /* Now login */
1274                                 send_srp_login(hostdata);
1275                         } else {
1276                                 dev_err(hostdata->dev, "Unable to send init rsp. rc=%ld\n", rc);
1277                         }
1278
1279                         break;
1280                 case 0x02:      /* Initialization response */
1281                         dev_info(hostdata->dev, "partner initialization complete\n");
1282
1283                         /* Now login */
1284                         send_srp_login(hostdata);
1285                         break;
1286                 default:
1287                         dev_err(hostdata->dev, "unknown crq message type: %d\n", crq->format);
1288                 }
1289                 return;
1290         case 0xFF:      /* Hypervisor telling us the connection is closed */
1291                 scsi_block_requests(hostdata->host);
1292                 atomic_set(&hostdata->request_limit, 0);
1293                 if (crq->format == 0x06) {
1294                         /* We need to re-setup the interpartition connection */
1295                         dev_info(hostdata->dev, "Re-enabling adapter!\n");
1296                         purge_requests(hostdata, DID_REQUEUE);
1297                         if ((ibmvscsi_ops->reenable_crq_queue(&hostdata->queue,
1298                                                               hostdata)) ||
1299                             (ibmvscsi_ops->send_crq(hostdata,
1300                                                     0xC001000000000000LL, 0))) {
1301                                         atomic_set(&hostdata->request_limit,
1302                                                    -1);
1303                                         dev_err(hostdata->dev, "error after enable\n");
1304                         }
1305                 } else {
1306                         dev_err(hostdata->dev, "Virtual adapter failed rc %d!\n",
1307                                 crq->format);
1308
1309                         purge_requests(hostdata, DID_ERROR);
1310                         if ((ibmvscsi_ops->reset_crq_queue(&hostdata->queue,
1311                                                            hostdata)) ||
1312                             (ibmvscsi_ops->send_crq(hostdata,
1313                                                     0xC001000000000000LL, 0))) {
1314                                         atomic_set(&hostdata->request_limit,
1315                                                    -1);
1316                                         dev_err(hostdata->dev, "error after reset\n");
1317                         }
1318                 }
1319                 scsi_unblock_requests(hostdata->host);
1320                 return;
1321         case 0x80:              /* real payload */
1322                 break;
1323         default:
1324                 dev_err(hostdata->dev, "got an invalid message type 0x%02x\n",
1325                         crq->valid);
1326                 return;
1327         }
1328
1329         /* The only kind of payload CRQs we should get are responses to
1330          * things we send. Make sure this response is to something we
1331          * actually sent
1332          */
1333         if (!valid_event_struct(&hostdata->pool, evt_struct)) {
1334                 dev_err(hostdata->dev, "returned correlation_token 0x%p is invalid!\n",
1335                        (void *)crq->IU_data_ptr);
1336                 return;
1337         }
1338
1339         if (atomic_read(&evt_struct->free)) {
1340                 dev_err(hostdata->dev, "received duplicate correlation_token 0x%p!\n",
1341                         (void *)crq->IU_data_ptr);
1342                 return;
1343         }
1344
1345         if (crq->format == VIOSRP_SRP_FORMAT)
1346                 atomic_add(evt_struct->xfer_iu->srp.rsp.req_lim_delta,
1347                            &hostdata->request_limit);
1348
1349         del_timer(&evt_struct->timer);
1350
1351         if (crq->status != VIOSRP_OK && evt_struct->cmnd)
1352                 evt_struct->cmnd->result = DID_ERROR << 16;
1353         if (evt_struct->done)
1354                 evt_struct->done(evt_struct);
1355         else
1356                 dev_err(hostdata->dev, "returned done() is NULL; not running it!\n");
1357
1358         /*
1359          * Lock the host_lock before messing with these structures, since we
1360          * are running in a task context
1361          */
1362         spin_lock_irqsave(evt_struct->hostdata->host->host_lock, flags);
1363         list_del(&evt_struct->list);
1364         free_event_struct(&evt_struct->hostdata->pool, evt_struct);
1365         spin_unlock_irqrestore(evt_struct->hostdata->host->host_lock, flags);
1366 }
1367
1368 /**
1369  * ibmvscsi_get_host_config: Send the command to the server to get host
1370  * configuration data.  The data is opaque to us.
1371  */
1372 static int ibmvscsi_do_host_config(struct ibmvscsi_host_data *hostdata,
1373                                    unsigned char *buffer, int length)
1374 {
1375         struct viosrp_host_config *host_config;
1376         struct srp_event_struct *evt_struct;
1377         unsigned long flags;
1378         dma_addr_t addr;
1379         int rc;
1380
1381         evt_struct = get_event_struct(&hostdata->pool);
1382         if (!evt_struct) {
1383                 dev_err(hostdata->dev, "couldn't allocate event for HOST_CONFIG!\n");
1384                 return -1;
1385         }
1386
1387         init_event_struct(evt_struct,
1388                           sync_completion,
1389                           VIOSRP_MAD_FORMAT,
1390                           init_timeout);
1391
1392         host_config = &evt_struct->iu.mad.host_config;
1393
1394         /* Set up a lun reset SRP command */
1395         memset(host_config, 0x00, sizeof(*host_config));
1396         host_config->common.type = VIOSRP_HOST_CONFIG_TYPE;
1397         host_config->common.length = length;
1398         host_config->buffer = addr = dma_map_single(hostdata->dev, buffer,
1399                                                     length,
1400                                                     DMA_BIDIRECTIONAL);
1401
1402         if (dma_mapping_error(host_config->buffer)) {
1403                 dev_err(hostdata->dev, "dma_mapping error getting host config\n");
1404                 free_event_struct(&hostdata->pool, evt_struct);
1405                 return -1;
1406         }
1407
1408         init_completion(&evt_struct->comp);
1409         spin_lock_irqsave(hostdata->host->host_lock, flags);
1410         rc = ibmvscsi_send_srp_event(evt_struct, hostdata, init_timeout * 2);
1411         spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1412         if (rc == 0)
1413                 wait_for_completion(&evt_struct->comp);
1414         dma_unmap_single(hostdata->dev, addr, length, DMA_BIDIRECTIONAL);
1415
1416         return rc;
1417 }
1418
1419 /**
1420  * ibmvscsi_slave_configure: Set the "allow_restart" flag for each disk.
1421  * @sdev:       struct scsi_device device to configure
1422  *
1423  * Enable allow_restart for a device if it is a disk.  Adjust the
1424  * queue_depth here also as is required by the documentation for
1425  * struct scsi_host_template.
1426  */
1427 static int ibmvscsi_slave_configure(struct scsi_device *sdev)
1428 {
1429         struct Scsi_Host *shost = sdev->host;
1430         unsigned long lock_flags = 0;
1431
1432         spin_lock_irqsave(shost->host_lock, lock_flags);
1433         if (sdev->type == TYPE_DISK) {
1434                 sdev->allow_restart = 1;
1435                 sdev->timeout = 60 * HZ;
1436         }
1437         scsi_adjust_queue_depth(sdev, 0, shost->cmd_per_lun);
1438         spin_unlock_irqrestore(shost->host_lock, lock_flags);
1439         return 0;
1440 }
1441
1442 /**
1443  * ibmvscsi_change_queue_depth - Change the device's queue depth
1444  * @sdev:       scsi device struct
1445  * @qdepth:     depth to set
1446  *
1447  * Return value:
1448  *      actual depth set
1449  **/
1450 static int ibmvscsi_change_queue_depth(struct scsi_device *sdev, int qdepth)
1451 {
1452         if (qdepth > IBMVSCSI_MAX_CMDS_PER_LUN)
1453                 qdepth = IBMVSCSI_MAX_CMDS_PER_LUN;
1454
1455         scsi_adjust_queue_depth(sdev, 0, qdepth);
1456         return sdev->queue_depth;
1457 }
1458
1459 /* ------------------------------------------------------------
1460  * sysfs attributes
1461  */
1462 static ssize_t show_host_srp_version(struct device *dev,
1463                                      struct device_attribute *attr, char *buf)
1464 {
1465         struct Scsi_Host *shost = class_to_shost(dev);
1466         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1467         int len;
1468
1469         len = snprintf(buf, PAGE_SIZE, "%s\n",
1470                        hostdata->madapter_info.srp_version);
1471         return len;
1472 }
1473
1474 static struct device_attribute ibmvscsi_host_srp_version = {
1475         .attr = {
1476                  .name = "srp_version",
1477                  .mode = S_IRUGO,
1478                  },
1479         .show = show_host_srp_version,
1480 };
1481
1482 static ssize_t show_host_partition_name(struct device *dev,
1483                                         struct device_attribute *attr,
1484                                         char *buf)
1485 {
1486         struct Scsi_Host *shost = class_to_shost(dev);
1487         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1488         int len;
1489
1490         len = snprintf(buf, PAGE_SIZE, "%s\n",
1491                        hostdata->madapter_info.partition_name);
1492         return len;
1493 }
1494
1495 static struct device_attribute ibmvscsi_host_partition_name = {
1496         .attr = {
1497                  .name = "partition_name",
1498                  .mode = S_IRUGO,
1499                  },
1500         .show = show_host_partition_name,
1501 };
1502
1503 static ssize_t show_host_partition_number(struct device *dev,
1504                                           struct device_attribute *attr,
1505                                           char *buf)
1506 {
1507         struct Scsi_Host *shost = class_to_shost(dev);
1508         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1509         int len;
1510
1511         len = snprintf(buf, PAGE_SIZE, "%d\n",
1512                        hostdata->madapter_info.partition_number);
1513         return len;
1514 }
1515
1516 static struct device_attribute ibmvscsi_host_partition_number = {
1517         .attr = {
1518                  .name = "partition_number",
1519                  .mode = S_IRUGO,
1520                  },
1521         .show = show_host_partition_number,
1522 };
1523
1524 static ssize_t show_host_mad_version(struct device *dev,
1525                                      struct device_attribute *attr, char *buf)
1526 {
1527         struct Scsi_Host *shost = class_to_shost(dev);
1528         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1529         int len;
1530
1531         len = snprintf(buf, PAGE_SIZE, "%d\n",
1532                        hostdata->madapter_info.mad_version);
1533         return len;
1534 }
1535
1536 static struct device_attribute ibmvscsi_host_mad_version = {
1537         .attr = {
1538                  .name = "mad_version",
1539                  .mode = S_IRUGO,
1540                  },
1541         .show = show_host_mad_version,
1542 };
1543
1544 static ssize_t show_host_os_type(struct device *dev,
1545                                  struct device_attribute *attr, char *buf)
1546 {
1547         struct Scsi_Host *shost = class_to_shost(dev);
1548         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1549         int len;
1550
1551         len = snprintf(buf, PAGE_SIZE, "%d\n", hostdata->madapter_info.os_type);
1552         return len;
1553 }
1554
1555 static struct device_attribute ibmvscsi_host_os_type = {
1556         .attr = {
1557                  .name = "os_type",
1558                  .mode = S_IRUGO,
1559                  },
1560         .show = show_host_os_type,
1561 };
1562
1563 static ssize_t show_host_config(struct device *dev,
1564                                 struct device_attribute *attr, char *buf)
1565 {
1566         struct Scsi_Host *shost = class_to_shost(dev);
1567         struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1568
1569         /* returns null-terminated host config data */
1570         if (ibmvscsi_do_host_config(hostdata, buf, PAGE_SIZE) == 0)
1571                 return strlen(buf);
1572         else
1573                 return 0;
1574 }
1575
1576 static struct device_attribute ibmvscsi_host_config = {
1577         .attr = {
1578                  .name = "config",
1579                  .mode = S_IRUGO,
1580                  },
1581         .show = show_host_config,
1582 };
1583
1584 static struct device_attribute *ibmvscsi_attrs[] = {
1585         &ibmvscsi_host_srp_version,
1586         &ibmvscsi_host_partition_name,
1587         &ibmvscsi_host_partition_number,
1588         &ibmvscsi_host_mad_version,
1589         &ibmvscsi_host_os_type,
1590         &ibmvscsi_host_config,
1591         NULL
1592 };
1593
1594 /* ------------------------------------------------------------
1595  * SCSI driver registration
1596  */
1597 static struct scsi_host_template driver_template = {
1598         .module = THIS_MODULE,
1599         .name = "IBM POWER Virtual SCSI Adapter " IBMVSCSI_VERSION,
1600         .proc_name = "ibmvscsi",
1601         .queuecommand = ibmvscsi_queuecommand,
1602         .eh_abort_handler = ibmvscsi_eh_abort_handler,
1603         .eh_device_reset_handler = ibmvscsi_eh_device_reset_handler,
1604         .eh_host_reset_handler = ibmvscsi_eh_host_reset_handler,
1605         .slave_configure = ibmvscsi_slave_configure,
1606         .change_queue_depth = ibmvscsi_change_queue_depth,
1607         .cmd_per_lun = 16,
1608         .can_queue = IBMVSCSI_MAX_REQUESTS_DEFAULT,
1609         .this_id = -1,
1610         .sg_tablesize = SG_ALL,
1611         .use_clustering = ENABLE_CLUSTERING,
1612         .shost_attrs = ibmvscsi_attrs,
1613 };
1614
1615 /**
1616  * Called by bus code for each adapter
1617  */
1618 static int ibmvscsi_probe(struct vio_dev *vdev, const struct vio_device_id *id)
1619 {
1620         struct ibmvscsi_host_data *hostdata;
1621         struct Scsi_Host *host;
1622         struct device *dev = &vdev->dev;
1623         struct srp_rport_identifiers ids;
1624         struct srp_rport *rport;
1625         unsigned long wait_switch = 0;
1626         int rc;
1627
1628         vdev->dev.driver_data = NULL;
1629
1630         driver_template.can_queue = max_requests;
1631         host = scsi_host_alloc(&driver_template, sizeof(*hostdata));
1632         if (!host) {
1633                 dev_err(&vdev->dev, "couldn't allocate host data\n");
1634                 goto scsi_host_alloc_failed;
1635         }
1636
1637         host->transportt = ibmvscsi_transport_template;
1638         hostdata = shost_priv(host);
1639         memset(hostdata, 0x00, sizeof(*hostdata));
1640         INIT_LIST_HEAD(&hostdata->sent);
1641         hostdata->host = host;
1642         hostdata->dev = dev;
1643         atomic_set(&hostdata->request_limit, -1);
1644         hostdata->host->max_sectors = 32 * 8; /* default max I/O 32 pages */
1645
1646         rc = ibmvscsi_ops->init_crq_queue(&hostdata->queue, hostdata, max_requests);
1647         if (rc != 0 && rc != H_RESOURCE) {
1648                 dev_err(&vdev->dev, "couldn't initialize crq. rc=%d\n", rc);
1649                 goto init_crq_failed;
1650         }
1651         if (initialize_event_pool(&hostdata->pool, max_requests, hostdata) != 0) {
1652                 dev_err(&vdev->dev, "couldn't initialize event pool\n");
1653                 goto init_pool_failed;
1654         }
1655
1656         host->max_lun = 8;
1657         host->max_id = max_id;
1658         host->max_channel = max_channel;
1659
1660         if (scsi_add_host(hostdata->host, hostdata->dev))
1661                 goto add_host_failed;
1662
1663         /* we don't have a proper target_port_id so let's use the fake one */
1664         memcpy(ids.port_id, hostdata->madapter_info.partition_name,
1665                sizeof(ids.port_id));
1666         ids.roles = SRP_RPORT_ROLE_TARGET;
1667         rport = srp_rport_add(host, &ids);
1668         if (IS_ERR(rport))
1669                 goto add_srp_port_failed;
1670
1671         /* Try to send an initialization message.  Note that this is allowed
1672          * to fail if the other end is not acive.  In that case we don't
1673          * want to scan
1674          */
1675         if (ibmvscsi_ops->send_crq(hostdata, 0xC001000000000000LL, 0) == 0
1676             || rc == H_RESOURCE) {
1677                 /*
1678                  * Wait around max init_timeout secs for the adapter to finish
1679                  * initializing. When we are done initializing, we will have a
1680                  * valid request_limit.  We don't want Linux scanning before
1681                  * we are ready.
1682                  */
1683                 for (wait_switch = jiffies + (init_timeout * HZ);
1684                      time_before(jiffies, wait_switch) &&
1685                      atomic_read(&hostdata->request_limit) < 2;) {
1686
1687                         msleep(10);
1688                 }
1689
1690                 /* if we now have a valid request_limit, initiate a scan */
1691                 if (atomic_read(&hostdata->request_limit) > 0)
1692                         scsi_scan_host(host);
1693         }
1694
1695         vdev->dev.driver_data = hostdata;
1696         return 0;
1697
1698       add_srp_port_failed:
1699         scsi_remove_host(hostdata->host);
1700       add_host_failed:
1701         release_event_pool(&hostdata->pool, hostdata);
1702       init_pool_failed:
1703         ibmvscsi_ops->release_crq_queue(&hostdata->queue, hostdata, max_requests);
1704       init_crq_failed:
1705         scsi_host_put(host);
1706       scsi_host_alloc_failed:
1707         return -1;
1708 }
1709
1710 static int ibmvscsi_remove(struct vio_dev *vdev)
1711 {
1712         struct ibmvscsi_host_data *hostdata = vdev->dev.driver_data;
1713         release_event_pool(&hostdata->pool, hostdata);
1714         ibmvscsi_ops->release_crq_queue(&hostdata->queue, hostdata,
1715                                         max_requests);
1716
1717         srp_remove_host(hostdata->host);
1718         scsi_remove_host(hostdata->host);
1719         scsi_host_put(hostdata->host);
1720
1721         return 0;
1722 }
1723
1724 /**
1725  * ibmvscsi_device_table: Used by vio.c to match devices in the device tree we 
1726  * support.
1727  */
1728 static struct vio_device_id ibmvscsi_device_table[] __devinitdata = {
1729         {"vscsi", "IBM,v-scsi"},
1730         { "", "" }
1731 };
1732 MODULE_DEVICE_TABLE(vio, ibmvscsi_device_table);
1733
1734 static struct vio_driver ibmvscsi_driver = {
1735         .id_table = ibmvscsi_device_table,
1736         .probe = ibmvscsi_probe,
1737         .remove = ibmvscsi_remove,
1738         .driver = {
1739                 .name = "ibmvscsi",
1740                 .owner = THIS_MODULE,
1741         }
1742 };
1743
1744 static struct srp_function_template ibmvscsi_transport_functions = {
1745 };
1746
1747 int __init ibmvscsi_module_init(void)
1748 {
1749         int ret;
1750
1751         if (firmware_has_feature(FW_FEATURE_ISERIES))
1752                 ibmvscsi_ops = &iseriesvscsi_ops;
1753         else if (firmware_has_feature(FW_FEATURE_VIO))
1754                 ibmvscsi_ops = &rpavscsi_ops;
1755         else
1756                 return -ENODEV;
1757
1758         ibmvscsi_transport_template =
1759                 srp_attach_transport(&ibmvscsi_transport_functions);
1760         if (!ibmvscsi_transport_template)
1761                 return -ENOMEM;
1762
1763         ret = vio_register_driver(&ibmvscsi_driver);
1764         if (ret)
1765                 srp_release_transport(ibmvscsi_transport_template);
1766         return ret;
1767 }
1768
1769 void __exit ibmvscsi_module_exit(void)
1770 {
1771         vio_unregister_driver(&ibmvscsi_driver);
1772         srp_release_transport(ibmvscsi_transport_template);
1773 }
1774
1775 module_init(ibmvscsi_module_init);
1776 module_exit(ibmvscsi_module_exit);