VServer 1.9.2 (patch-2.6.8.1-vs1.9.2.diff)
[linux-2.6.git] / drivers / scsi / scsi_lib.c
1 /*
2  *  scsi_lib.c Copyright (C) 1999 Eric Youngdale
3  *
4  *  SCSI queueing library.
5  *      Initial versions: Eric Youngdale (eric@andante.org).
6  *                        Based upon conversations with large numbers
7  *                        of people at Linux Expo.
8  */
9
10 #include <linux/bio.h>
11 #include <linux/blkdev.h>
12 #include <linux/completion.h>
13 #include <linux/kernel.h>
14 #include <linux/mempool.h>
15 #include <linux/slab.h>
16 #include <linux/init.h>
17 #include <linux/pci.h>
18
19 #include <scsi/scsi.h>
20 #include <scsi/scsi_dbg.h>
21 #include <scsi/scsi_device.h>
22 #include <scsi/scsi_driver.h>
23 #include <scsi/scsi_eh.h>
24 #include <scsi/scsi_host.h>
25 #include <scsi/scsi_request.h>
26
27 #include "scsi_priv.h"
28 #include "scsi_logging.h"
29
30
31 #define SG_MEMPOOL_NR           (sizeof(scsi_sg_pools)/sizeof(struct scsi_host_sg_pool))
32 #define SG_MEMPOOL_SIZE         32
33
34 struct scsi_host_sg_pool {
35         size_t          size;
36         char            *name; 
37         kmem_cache_t    *slab;
38         mempool_t       *pool;
39 };
40
41 #if (SCSI_MAX_PHYS_SEGMENTS < 32)
42 #error SCSI_MAX_PHYS_SEGMENTS is too small
43 #endif
44
45 #define SP(x) { x, "sgpool-" #x } 
46 struct scsi_host_sg_pool scsi_sg_pools[] = { 
47         SP(8),
48         SP(16),
49         SP(32),
50 #if (SCSI_MAX_PHYS_SEGMENTS > 32)
51         SP(64),
52 #if (SCSI_MAX_PHYS_SEGMENTS > 64)
53         SP(128),
54 #if (SCSI_MAX_PHYS_SEGMENTS > 128)
55         SP(256),
56 #if (SCSI_MAX_PHYS_SEGMENTS > 256)
57 #error SCSI_MAX_PHYS_SEGMENTS is too large
58 #endif
59 #endif
60 #endif
61 #endif
62 };      
63 #undef SP
64
65
66 /*
67  * Function:    scsi_insert_special_req()
68  *
69  * Purpose:     Insert pre-formed request into request queue.
70  *
71  * Arguments:   sreq    - request that is ready to be queued.
72  *              at_head - boolean.  True if we should insert at head
73  *                        of queue, false if we should insert at tail.
74  *
75  * Lock status: Assumed that lock is not held upon entry.
76  *
77  * Returns:     Nothing
78  *
79  * Notes:       This function is called from character device and from
80  *              ioctl types of functions where the caller knows exactly
81  *              what SCSI command needs to be issued.   The idea is that
82  *              we merely inject the command into the queue (at the head
83  *              for now), and then call the queue request function to actually
84  *              process it.
85  */
86 int scsi_insert_special_req(struct scsi_request *sreq, int at_head)
87 {
88         /*
89          * Because users of this function are apt to reuse requests with no
90          * modification, we have to sanitise the request flags here
91          */
92         sreq->sr_request->flags &= ~REQ_DONTPREP;
93         blk_insert_request(sreq->sr_device->request_queue, sreq->sr_request,
94                            at_head, sreq, 0);
95         return 0;
96 }
97
98 /*
99  * Function:    scsi_queue_insert()
100  *
101  * Purpose:     Insert a command in the midlevel queue.
102  *
103  * Arguments:   cmd    - command that we are adding to queue.
104  *              reason - why we are inserting command to queue.
105  *
106  * Lock status: Assumed that lock is not held upon entry.
107  *
108  * Returns:     Nothing.
109  *
110  * Notes:       We do this for one of two cases.  Either the host is busy
111  *              and it cannot accept any more commands for the time being,
112  *              or the device returned QUEUE_FULL and can accept no more
113  *              commands.
114  * Notes:       This could be called either from an interrupt context or a
115  *              normal process context.
116  */
117 int scsi_queue_insert(struct scsi_cmnd *cmd, int reason)
118 {
119         struct Scsi_Host *host = cmd->device->host;
120         struct scsi_device *device = cmd->device;
121
122         SCSI_LOG_MLQUEUE(1,
123                  printk("Inserting command %p into mlqueue\n", cmd));
124
125         /*
126          * We are inserting the command into the ml queue.  First, we
127          * cancel the timer, so it doesn't time out.
128          */
129         scsi_delete_timer(cmd);
130
131         /*
132          * Next, set the appropriate busy bit for the device/host.
133          *
134          * If the host/device isn't busy, assume that something actually
135          * completed, and that we should be able to queue a command now.
136          *
137          * Note that the prior mid-layer assumption that any host could
138          * always queue at least one command is now broken.  The mid-layer
139          * will implement a user specifiable stall (see
140          * scsi_host.max_host_blocked and scsi_device.max_device_blocked)
141          * if a command is requeued with no other commands outstanding
142          * either for the device or for the host.
143          */
144         if (reason == SCSI_MLQUEUE_HOST_BUSY)
145                 host->host_blocked = host->max_host_blocked;
146         else if (reason == SCSI_MLQUEUE_DEVICE_BUSY)
147                 device->device_blocked = device->max_device_blocked;
148
149         /*
150          * Register the fact that we own the thing for now.
151          */
152         cmd->state = SCSI_STATE_MLQUEUE;
153         cmd->owner = SCSI_OWNER_MIDLEVEL;
154
155         /*
156          * Decrement the counters, since these commands are no longer
157          * active on the host/device.
158          */
159         scsi_device_unbusy(device);
160
161         /*
162          * Insert this command at the head of the queue for it's device.
163          * It will go before all other commands that are already in the queue.
164          *
165          * NOTE: there is magic here about the way the queue is plugged if
166          * we have no outstanding commands.
167          * 
168          * Although this *doesn't* plug the queue, it does call the request
169          * function.  The SCSI request function detects the blocked condition
170          * and plugs the queue appropriately.
171          */
172         blk_insert_request(device->request_queue, cmd->request, 1, cmd, 1);
173         return 0;
174 }
175
176 /*
177  * Function:    scsi_do_req
178  *
179  * Purpose:     Queue a SCSI request
180  *
181  * Arguments:   sreq      - command descriptor.
182  *              cmnd      - actual SCSI command to be performed.
183  *              buffer    - data buffer.
184  *              bufflen   - size of data buffer.
185  *              done      - completion function to be run.
186  *              timeout   - how long to let it run before timeout.
187  *              retries   - number of retries we allow.
188  *
189  * Lock status: No locks held upon entry.
190  *
191  * Returns:     Nothing.
192  *
193  * Notes:       This function is only used for queueing requests for things
194  *              like ioctls and character device requests - this is because
195  *              we essentially just inject a request into the queue for the
196  *              device.
197  *
198  *              In order to support the scsi_device_quiesce function, we
199  *              now inject requests on the *head* of the device queue
200  *              rather than the tail.
201  */
202 void scsi_do_req(struct scsi_request *sreq, const void *cmnd,
203                  void *buffer, unsigned bufflen,
204                  void (*done)(struct scsi_cmnd *),
205                  int timeout, int retries)
206 {
207         /*
208          * If the upper level driver is reusing these things, then
209          * we should release the low-level block now.  Another one will
210          * be allocated later when this request is getting queued.
211          */
212         __scsi_release_request(sreq);
213
214         /*
215          * Our own function scsi_done (which marks the host as not busy,
216          * disables the timeout counter, etc) will be called by us or by the
217          * scsi_hosts[host].queuecommand() function needs to also call
218          * the completion function for the high level driver.
219          */
220         memcpy(sreq->sr_cmnd, cmnd, sizeof(sreq->sr_cmnd));
221         sreq->sr_bufflen = bufflen;
222         sreq->sr_buffer = buffer;
223         sreq->sr_allowed = retries;
224         sreq->sr_done = done;
225         sreq->sr_timeout_per_command = timeout;
226
227         if (sreq->sr_cmd_len == 0)
228                 sreq->sr_cmd_len = COMMAND_SIZE(sreq->sr_cmnd[0]);
229
230         /*
231          * head injection *required* here otherwise quiesce won't work
232          */
233         scsi_insert_special_req(sreq, 1);
234 }
235  
236 static void scsi_wait_done(struct scsi_cmnd *cmd)
237 {
238         struct request *req = cmd->request;
239         struct request_queue *q = cmd->device->request_queue;
240         unsigned long flags;
241
242         req->rq_status = RQ_SCSI_DONE;  /* Busy, but indicate request done */
243
244         spin_lock_irqsave(q->queue_lock, flags);
245         if (blk_rq_tagged(req))
246                 blk_queue_end_tag(q, req);
247         spin_unlock_irqrestore(q->queue_lock, flags);
248
249         if (req->waiting)
250                 complete(req->waiting);
251 }
252
253 void scsi_wait_req(struct scsi_request *sreq, const void *cmnd, void *buffer,
254                    unsigned bufflen, int timeout, int retries)
255 {
256         DECLARE_COMPLETION(wait);
257         
258         sreq->sr_request->waiting = &wait;
259         sreq->sr_request->rq_status = RQ_SCSI_BUSY;
260         scsi_do_req(sreq, cmnd, buffer, bufflen, scsi_wait_done,
261                         timeout, retries);
262         wait_for_completion(&wait);
263         sreq->sr_request->waiting = NULL;
264         if (sreq->sr_request->rq_status != RQ_SCSI_DONE)
265                 sreq->sr_result |= (DRIVER_ERROR << 24);
266
267         __scsi_release_request(sreq);
268 }
269
270 /*
271  * Function:    scsi_init_cmd_errh()
272  *
273  * Purpose:     Initialize cmd fields related to error handling.
274  *
275  * Arguments:   cmd     - command that is ready to be queued.
276  *
277  * Returns:     Nothing
278  *
279  * Notes:       This function has the job of initializing a number of
280  *              fields related to error handling.   Typically this will
281  *              be called once for each command, as required.
282  */
283 static int scsi_init_cmd_errh(struct scsi_cmnd *cmd)
284 {
285         cmd->owner = SCSI_OWNER_MIDLEVEL;
286         cmd->serial_number = 0;
287         cmd->serial_number_at_timeout = 0;
288         cmd->abort_reason = 0;
289
290         memset(cmd->sense_buffer, 0, sizeof cmd->sense_buffer);
291
292         if (cmd->cmd_len == 0)
293                 cmd->cmd_len = COMMAND_SIZE(cmd->cmnd[0]);
294
295         /*
296          * We need saved copies of a number of fields - this is because
297          * error handling may need to overwrite these with different values
298          * to run different commands, and once error handling is complete,
299          * we will need to restore these values prior to running the actual
300          * command.
301          */
302         cmd->old_use_sg = cmd->use_sg;
303         cmd->old_cmd_len = cmd->cmd_len;
304         cmd->sc_old_data_direction = cmd->sc_data_direction;
305         cmd->old_underflow = cmd->underflow;
306         memcpy(cmd->data_cmnd, cmd->cmnd, sizeof(cmd->cmnd));
307         cmd->buffer = cmd->request_buffer;
308         cmd->bufflen = cmd->request_bufflen;
309         cmd->internal_timeout = NORMAL_TIMEOUT;
310         cmd->abort_reason = 0;
311
312         return 1;
313 }
314
315 /*
316  * Function:   scsi_setup_cmd_retry()
317  *
318  * Purpose:    Restore the command state for a retry
319  *
320  * Arguments:  cmd      - command to be restored
321  *
322  * Returns:    Nothing
323  *
324  * Notes:      Immediately prior to retrying a command, we need
325  *             to restore certain fields that we saved above.
326  */
327 void scsi_setup_cmd_retry(struct scsi_cmnd *cmd)
328 {
329         memcpy(cmd->cmnd, cmd->data_cmnd, sizeof(cmd->data_cmnd));
330         cmd->request_buffer = cmd->buffer;
331         cmd->request_bufflen = cmd->bufflen;
332         cmd->use_sg = cmd->old_use_sg;
333         cmd->cmd_len = cmd->old_cmd_len;
334         cmd->sc_data_direction = cmd->sc_old_data_direction;
335         cmd->underflow = cmd->old_underflow;
336 }
337
338 void scsi_device_unbusy(struct scsi_device *sdev)
339 {
340         struct Scsi_Host *shost = sdev->host;
341         unsigned long flags;
342
343         spin_lock_irqsave(shost->host_lock, flags);
344         shost->host_busy--;
345         if (unlikely(test_bit(SHOST_RECOVERY, &shost->shost_state) &&
346                      shost->host_failed))
347                 scsi_eh_wakeup(shost);
348         spin_unlock(shost->host_lock);
349         spin_lock(&sdev->sdev_lock);
350         sdev->device_busy--;
351         spin_unlock_irqrestore(&sdev->sdev_lock, flags);
352 }
353
354 /*
355  * Called for single_lun devices on IO completion. Clear starget_sdev_user,
356  * and call blk_run_queue for all the scsi_devices on the target -
357  * including current_sdev first.
358  *
359  * Called with *no* scsi locks held.
360  */
361 static void scsi_single_lun_run(struct scsi_device *current_sdev)
362 {
363         struct Scsi_Host *shost = current_sdev->host;
364         struct scsi_device *sdev, *tmp;
365         unsigned long flags;
366
367         spin_lock_irqsave(shost->host_lock, flags);
368         current_sdev->sdev_target->starget_sdev_user = NULL;
369         spin_unlock_irqrestore(shost->host_lock, flags);
370
371         /*
372          * Call blk_run_queue for all LUNs on the target, starting with
373          * current_sdev. We race with others (to set starget_sdev_user),
374          * but in most cases, we will be first. Ideally, each LU on the
375          * target would get some limited time or requests on the target.
376          */
377         blk_run_queue(current_sdev->request_queue);
378
379         spin_lock_irqsave(shost->host_lock, flags);
380         if (current_sdev->sdev_target->starget_sdev_user)
381                 goto out;
382         list_for_each_entry_safe(sdev, tmp, &current_sdev->same_target_siblings,
383                         same_target_siblings) {
384                 if (scsi_device_get(sdev))
385                         continue;
386
387                 spin_unlock_irqrestore(shost->host_lock, flags);
388                 blk_run_queue(sdev->request_queue);
389                 spin_lock_irqsave(shost->host_lock, flags);
390         
391                 scsi_device_put(sdev);
392         }
393  out:
394         spin_unlock_irqrestore(shost->host_lock, flags);
395 }
396
397 /*
398  * Function:    scsi_run_queue()
399  *
400  * Purpose:     Select a proper request queue to serve next
401  *
402  * Arguments:   q       - last request's queue
403  *
404  * Returns:     Nothing
405  *
406  * Notes:       The previous command was completely finished, start
407  *              a new one if possible.
408  */
409 static void scsi_run_queue(struct request_queue *q)
410 {
411         struct scsi_device *sdev = q->queuedata;
412         struct Scsi_Host *shost = sdev->host;
413         unsigned long flags;
414
415         if (sdev->single_lun)
416                 scsi_single_lun_run(sdev);
417
418         spin_lock_irqsave(shost->host_lock, flags);
419         while (!list_empty(&shost->starved_list) &&
420                !shost->host_blocked && !shost->host_self_blocked &&
421                 !((shost->can_queue > 0) &&
422                   (shost->host_busy >= shost->can_queue))) {
423                 /*
424                  * As long as shost is accepting commands and we have
425                  * starved queues, call blk_run_queue. scsi_request_fn
426                  * drops the queue_lock and can add us back to the
427                  * starved_list.
428                  *
429                  * host_lock protects the starved_list and starved_entry.
430                  * scsi_request_fn must get the host_lock before checking
431                  * or modifying starved_list or starved_entry.
432                  */
433                 sdev = list_entry(shost->starved_list.next,
434                                           struct scsi_device, starved_entry);
435                 list_del_init(&sdev->starved_entry);
436                 spin_unlock_irqrestore(shost->host_lock, flags);
437
438                 blk_run_queue(sdev->request_queue);
439
440                 spin_lock_irqsave(shost->host_lock, flags);
441                 if (unlikely(!list_empty(&sdev->starved_entry)))
442                         /*
443                          * sdev lost a race, and was put back on the
444                          * starved list. This is unlikely but without this
445                          * in theory we could loop forever.
446                          */
447                         break;
448         }
449         spin_unlock_irqrestore(shost->host_lock, flags);
450
451         blk_run_queue(q);
452 }
453
454 /*
455  * Function:    scsi_requeue_command()
456  *
457  * Purpose:     Handle post-processing of completed commands.
458  *
459  * Arguments:   q       - queue to operate on
460  *              cmd     - command that may need to be requeued.
461  *
462  * Returns:     Nothing
463  *
464  * Notes:       After command completion, there may be blocks left
465  *              over which weren't finished by the previous command
466  *              this can be for a number of reasons - the main one is
467  *              I/O errors in the middle of the request, in which case
468  *              we need to request the blocks that come after the bad
469  *              sector.
470  */
471 static void scsi_requeue_command(struct request_queue *q, struct scsi_cmnd *cmd)
472 {
473         cmd->request->flags &= ~REQ_DONTPREP;
474         blk_insert_request(q, cmd->request, 1, cmd, 1);
475
476         scsi_run_queue(q);
477 }
478
479 void scsi_next_command(struct scsi_cmnd *cmd)
480 {
481         struct request_queue *q = cmd->device->request_queue;
482
483         scsi_put_command(cmd);
484         scsi_run_queue(q);
485 }
486
487 void scsi_run_host_queues(struct Scsi_Host *shost)
488 {
489         struct scsi_device *sdev;
490
491         shost_for_each_device(sdev, shost)
492                 scsi_run_queue(sdev->request_queue);
493 }
494
495 /*
496  * Function:    scsi_end_request()
497  *
498  * Purpose:     Post-processing of completed commands called from interrupt
499  *              handler or a bottom-half handler.
500  *
501  * Arguments:   cmd      - command that is complete.
502  *              uptodate - 1 if I/O indicates success, 0 for I/O error.
503  *              sectors  - number of sectors we want to mark.
504  *              requeue  - indicates whether we should requeue leftovers.
505  *              frequeue - indicates that if we release the command block
506  *                         that the queue request function should be called.
507  *
508  * Lock status: Assumed that lock is not held upon entry.
509  *
510  * Returns:     Nothing
511  *
512  * Notes:       This is called for block device requests in order to
513  *              mark some number of sectors as complete.
514  * 
515  *              We are guaranteeing that the request queue will be goosed
516  *              at some point during this call.
517  */
518 static struct scsi_cmnd *scsi_end_request(struct scsi_cmnd *cmd, int uptodate,
519                                           int bytes, int requeue)
520 {
521         request_queue_t *q = cmd->device->request_queue;
522         struct request *req = cmd->request;
523         unsigned long flags;
524
525         /*
526          * If there are blocks left over at the end, set up the command
527          * to queue the remainder of them.
528          */
529         if (end_that_request_chunk(req, uptodate, bytes)) {
530                 int leftover = (req->hard_nr_sectors << 9);
531
532                 if (blk_pc_request(req))
533                         leftover = req->data_len;
534
535                 /* kill remainder if no retrys */
536                 if (!uptodate && blk_noretry_request(req))
537                         end_that_request_chunk(req, 0, leftover);
538                 else {
539                         if (requeue)
540                                 /*
541                                  * Bleah.  Leftovers again.  Stick the
542                                  * leftovers in the front of the
543                                  * queue, and goose the queue again.
544                                  */
545                                 scsi_requeue_command(q, cmd);
546
547                         return cmd;
548                 }
549         }
550
551         add_disk_randomness(req->rq_disk);
552
553         spin_lock_irqsave(q->queue_lock, flags);
554         if (blk_rq_tagged(req))
555                 blk_queue_end_tag(q, req);
556         end_that_request_last(req);
557         spin_unlock_irqrestore(q->queue_lock, flags);
558
559         /*
560          * This will goose the queue request function at the end, so we don't
561          * need to worry about launching another command.
562          */
563         scsi_next_command(cmd);
564         return NULL;
565 }
566
567 static struct scatterlist *scsi_alloc_sgtable(struct scsi_cmnd *cmd, int gfp_mask)
568 {
569         struct scsi_host_sg_pool *sgp;
570         struct scatterlist *sgl;
571
572         BUG_ON(!cmd->use_sg);
573
574         switch (cmd->use_sg) {
575         case 1 ... 8:
576                 cmd->sglist_len = 0;
577                 break;
578         case 9 ... 16:
579                 cmd->sglist_len = 1;
580                 break;
581         case 17 ... 32:
582                 cmd->sglist_len = 2;
583                 break;
584 #if (SCSI_MAX_PHYS_SEGMENTS > 32)
585         case 33 ... 64:
586                 cmd->sglist_len = 3;
587                 break;
588 #if (SCSI_MAX_PHYS_SEGMENTS > 64)
589         case 65 ... 128:
590                 cmd->sglist_len = 4;
591                 break;
592 #if (SCSI_MAX_PHYS_SEGMENTS  > 128)
593         case 129 ... 256:
594                 cmd->sglist_len = 5;
595                 break;
596 #endif
597 #endif
598 #endif
599         default:
600                 return NULL;
601         }
602
603         sgp = scsi_sg_pools + cmd->sglist_len;
604         sgl = mempool_alloc(sgp->pool, gfp_mask);
605         if (sgl)
606                 memset(sgl, 0, sgp->size);
607         return sgl;
608 }
609
610 static void scsi_free_sgtable(struct scatterlist *sgl, int index)
611 {
612         struct scsi_host_sg_pool *sgp;
613
614         BUG_ON(index > SG_MEMPOOL_NR);
615
616         sgp = scsi_sg_pools + index;
617         mempool_free(sgl, sgp->pool);
618 }
619
620 /*
621  * Function:    scsi_release_buffers()
622  *
623  * Purpose:     Completion processing for block device I/O requests.
624  *
625  * Arguments:   cmd     - command that we are bailing.
626  *
627  * Lock status: Assumed that no lock is held upon entry.
628  *
629  * Returns:     Nothing
630  *
631  * Notes:       In the event that an upper level driver rejects a
632  *              command, we must release resources allocated during
633  *              the __init_io() function.  Primarily this would involve
634  *              the scatter-gather table, and potentially any bounce
635  *              buffers.
636  */
637 static void scsi_release_buffers(struct scsi_cmnd *cmd)
638 {
639         struct request *req = cmd->request;
640
641         /*
642          * Free up any indirection buffers we allocated for DMA purposes. 
643          */
644         if (cmd->use_sg)
645                 scsi_free_sgtable(cmd->request_buffer, cmd->sglist_len);
646         else if (cmd->request_buffer != req->buffer)
647                 kfree(cmd->request_buffer);
648
649         /*
650          * Zero these out.  They now point to freed memory, and it is
651          * dangerous to hang onto the pointers.
652          */
653         cmd->buffer  = NULL;
654         cmd->bufflen = 0;
655         cmd->request_buffer = NULL;
656         cmd->request_bufflen = 0;
657 }
658
659 /*
660  * Function:    scsi_io_completion()
661  *
662  * Purpose:     Completion processing for block device I/O requests.
663  *
664  * Arguments:   cmd   - command that is finished.
665  *
666  * Lock status: Assumed that no lock is held upon entry.
667  *
668  * Returns:     Nothing
669  *
670  * Notes:       This function is matched in terms of capabilities to
671  *              the function that created the scatter-gather list.
672  *              In other words, if there are no bounce buffers
673  *              (the normal case for most drivers), we don't need
674  *              the logic to deal with cleaning up afterwards.
675  *
676  *              We must do one of several things here:
677  *
678  *              a) Call scsi_end_request.  This will finish off the
679  *                 specified number of sectors.  If we are done, the
680  *                 command block will be released, and the queue
681  *                 function will be goosed.  If we are not done, then
682  *                 scsi_end_request will directly goose the queue.
683  *
684  *              b) We can just use scsi_requeue_command() here.  This would
685  *                 be used if we just wanted to retry, for example.
686  */
687 void scsi_io_completion(struct scsi_cmnd *cmd, unsigned int good_bytes,
688                         unsigned int block_bytes)
689 {
690         int result = cmd->result;
691         int this_count = cmd->bufflen;
692         request_queue_t *q = cmd->device->request_queue;
693         struct request *req = cmd->request;
694         int clear_errors = 1;
695
696         /*
697          * Free up any indirection buffers we allocated for DMA purposes. 
698          * For the case of a READ, we need to copy the data out of the
699          * bounce buffer and into the real buffer.
700          */
701         if (cmd->use_sg)
702                 scsi_free_sgtable(cmd->buffer, cmd->sglist_len);
703         else if (cmd->buffer != req->buffer) {
704                 if (rq_data_dir(req) == READ) {
705                         unsigned long flags;
706                         char *to = bio_kmap_irq(req->bio, &flags);
707                         memcpy(to, cmd->buffer, cmd->bufflen);
708                         bio_kunmap_irq(to, &flags);
709                 }
710                 kfree(cmd->buffer);
711         }
712
713         if (blk_pc_request(req)) { /* SG_IO ioctl from block level */
714                 req->errors = (driver_byte(result) & DRIVER_SENSE) ?
715                               (CHECK_CONDITION << 1) : (result & 0xff);
716                 if (result) {
717                         clear_errors = 0;
718                         if (cmd->sense_buffer[0] & 0x70) {
719                                 int len = 8 + cmd->sense_buffer[7];
720
721                                 if (len > SCSI_SENSE_BUFFERSIZE)
722                                         len = SCSI_SENSE_BUFFERSIZE;
723                                 memcpy(req->sense, cmd->sense_buffer,  len);
724                                 req->sense_len = len;
725                         }
726                 } else
727                         req->data_len -= cmd->bufflen;
728         }
729
730         /*
731          * Zero these out.  They now point to freed memory, and it is
732          * dangerous to hang onto the pointers.
733          */
734         cmd->buffer  = NULL;
735         cmd->bufflen = 0;
736         cmd->request_buffer = NULL;
737         cmd->request_bufflen = 0;
738
739         /*
740          * Next deal with any sectors which we were able to correctly
741          * handle.
742          */
743         if (good_bytes >= 0) {
744                 SCSI_LOG_HLCOMPLETE(1, printk("%ld sectors total, %d bytes done.\n",
745                                               req->nr_sectors, good_bytes));
746                 SCSI_LOG_HLCOMPLETE(1, printk("use_sg is %d\n", cmd->use_sg));
747
748                 if (clear_errors)
749                         req->errors = 0;
750                 /*
751                  * If multiple sectors are requested in one buffer, then
752                  * they will have been finished off by the first command.
753                  * If not, then we have a multi-buffer command.
754                  *
755                  * If block_bytes != 0, it means we had a medium error
756                  * of some sort, and that we want to mark some number of
757                  * sectors as not uptodate.  Thus we want to inhibit
758                  * requeueing right here - we will requeue down below
759                  * when we handle the bad sectors.
760                  */
761                 cmd = scsi_end_request(cmd, 1, good_bytes, result == 0);
762
763                 /*
764                  * If the command completed without error, then either finish off the
765                  * rest of the command, or start a new one.
766                  */
767                 if (result == 0 || cmd == NULL ) {
768                         return;
769                 }
770         }
771         /*
772          * Now, if we were good little boys and girls, Santa left us a request
773          * sense buffer.  We can extract information from this, so we
774          * can choose a block to remap, etc.
775          */
776         if (driver_byte(result) != 0) {
777                 if ((cmd->sense_buffer[0] & 0x7f) == 0x70) {
778                         /*
779                          * If the device is in the process of becoming ready,
780                          * retry.
781                          */
782                         if (cmd->sense_buffer[12] == 0x04 &&
783                             cmd->sense_buffer[13] == 0x01) {
784                                 scsi_requeue_command(q, cmd);
785                                 return;
786                         }
787                         if ((cmd->sense_buffer[2] & 0xf) == UNIT_ATTENTION) {
788                                 if (cmd->device->removable) {
789                                         /* detected disc change.  set a bit 
790                                          * and quietly refuse further access.
791                                          */
792                                         cmd->device->changed = 1;
793                                         cmd = scsi_end_request(cmd, 0,
794                                                         this_count, 1);
795                                         return;
796                                 } else {
797                                         /*
798                                         * Must have been a power glitch, or a
799                                         * bus reset.  Could not have been a
800                                         * media change, so we just retry the
801                                         * request and see what happens.  
802                                         */
803                                         scsi_requeue_command(q, cmd);
804                                         return;
805                                 }
806                         }
807                 }
808                 /*
809                  * If we had an ILLEGAL REQUEST returned, then we may have
810                  * performed an unsupported command.  The only thing this
811                  * should be would be a ten byte read where only a six byte
812                  * read was supported.  Also, on a system where READ CAPACITY
813                  * failed, we may have read past the end of the disk.
814                  */
815
816                 switch (cmd->sense_buffer[2]) {
817                 case ILLEGAL_REQUEST:
818                         if (cmd->device->use_10_for_rw &&
819                             (cmd->cmnd[0] == READ_10 ||
820                              cmd->cmnd[0] == WRITE_10)) {
821                                 cmd->device->use_10_for_rw = 0;
822                                 /*
823                                  * This will cause a retry with a 6-byte
824                                  * command.
825                                  */
826                                 scsi_requeue_command(q, cmd);
827                                 result = 0;
828                         } else {
829                                 cmd = scsi_end_request(cmd, 0, this_count, 1);
830                                 return;
831                         }
832                         break;
833                 case NOT_READY:
834                         printk(KERN_INFO "Device %s not ready.\n",
835                                req->rq_disk ? req->rq_disk->disk_name : "");
836                         cmd = scsi_end_request(cmd, 0, this_count, 1);
837                         return;
838                         break;
839                 case MEDIUM_ERROR:
840                 case VOLUME_OVERFLOW:
841                         printk("scsi%d: ERROR on channel %d, id %d, lun %d, CDB: ",
842                                cmd->device->host->host_no, (int) cmd->device->channel,
843                                (int) cmd->device->id, (int) cmd->device->lun);
844                         __scsi_print_command(cmd->data_cmnd);
845                         scsi_print_sense("", cmd);
846                         cmd = scsi_end_request(cmd, 0, block_bytes, 1);
847                         return;
848                 default:
849                         break;
850                 }
851         }                       /* driver byte != 0 */
852         if (host_byte(result) == DID_RESET) {
853                 /*
854                  * Third party bus reset or reset for error
855                  * recovery reasons.  Just retry the request
856                  * and see what happens.  
857                  */
858                 scsi_requeue_command(q, cmd);
859                 return;
860         }
861         if (result) {
862                 printk("SCSI error : <%d %d %d %d> return code = 0x%x\n",
863                        cmd->device->host->host_no,
864                        cmd->device->channel,
865                        cmd->device->id,
866                        cmd->device->lun, result);
867
868                 if (driver_byte(result) & DRIVER_SENSE)
869                         scsi_print_sense("", cmd);
870                 /*
871                  * Mark a single buffer as not uptodate.  Queue the remainder.
872                  * We sometimes get this cruft in the event that a medium error
873                  * isn't properly reported.
874                  */
875                 block_bytes = req->hard_cur_sectors << 9;
876                 if (!block_bytes)
877                         block_bytes = req->data_len;
878                 cmd = scsi_end_request(cmd, 0, block_bytes, 1);
879         }
880 }
881
882 /*
883  * Function:    scsi_init_io()
884  *
885  * Purpose:     SCSI I/O initialize function.
886  *
887  * Arguments:   cmd   - Command descriptor we wish to initialize
888  *
889  * Returns:     0 on success
890  *              BLKPREP_DEFER if the failure is retryable
891  *              BLKPREP_KILL if the failure is fatal
892  */
893 static int scsi_init_io(struct scsi_cmnd *cmd)
894 {
895         struct request     *req = cmd->request;
896         struct scatterlist *sgpnt;
897         int                count;
898
899         /*
900          * if this is a rq->data based REQ_BLOCK_PC, setup for a non-sg xfer
901          */
902         if ((req->flags & REQ_BLOCK_PC) && !req->bio) {
903                 cmd->request_bufflen = req->data_len;
904                 cmd->request_buffer = req->data;
905                 req->buffer = req->data;
906                 cmd->use_sg = 0;
907                 return 0;
908         }
909
910         /*
911          * we used to not use scatter-gather for single segment request,
912          * but now we do (it makes highmem I/O easier to support without
913          * kmapping pages)
914          */
915         cmd->use_sg = req->nr_phys_segments;
916
917         /*
918          * if sg table allocation fails, requeue request later.
919          */
920         sgpnt = scsi_alloc_sgtable(cmd, GFP_ATOMIC);
921         if (unlikely(!sgpnt)) {
922                 req->flags |= REQ_SPECIAL;
923                 return BLKPREP_DEFER;
924         }
925
926         cmd->request_buffer = (char *) sgpnt;
927         cmd->request_bufflen = req->nr_sectors << 9;
928         if (blk_pc_request(req))
929                 cmd->request_bufflen = req->data_len;
930         req->buffer = NULL;
931
932         /* 
933          * Next, walk the list, and fill in the addresses and sizes of
934          * each segment.
935          */
936         count = blk_rq_map_sg(req->q, req, cmd->request_buffer);
937
938         /*
939          * mapped well, send it off
940          */
941         if (likely(count <= cmd->use_sg)) {
942                 cmd->use_sg = count;
943                 return 0;
944         }
945
946         printk(KERN_ERR "Incorrect number of segments after building list\n");
947         printk(KERN_ERR "counted %d, received %d\n", count, cmd->use_sg);
948         printk(KERN_ERR "req nr_sec %lu, cur_nr_sec %u\n", req->nr_sectors,
949                         req->current_nr_sectors);
950
951         /* release the command and kill it */
952         scsi_release_buffers(cmd);
953         scsi_put_command(cmd);
954         return BLKPREP_KILL;
955 }
956
957 static int scsi_prep_fn(struct request_queue *q, struct request *req)
958 {
959         struct scsi_device *sdev = q->queuedata;
960         struct scsi_cmnd *cmd;
961         int specials_only = 0;
962
963         /*
964          * Just check to see if the device is online.  If it isn't, we
965          * refuse to process any commands.  The device must be brought
966          * online before trying any recovery commands
967          */
968         if (unlikely(!scsi_device_online(sdev))) {
969                 printk(KERN_ERR "scsi%d (%d:%d): rejecting I/O to offline device\n",
970                        sdev->host->host_no, sdev->id, sdev->lun);
971                 return BLKPREP_KILL;
972         }
973         if (unlikely(sdev->sdev_state != SDEV_RUNNING)) {
974                 /* OK, we're not in a running state don't prep
975                  * user commands */
976                 if (sdev->sdev_state == SDEV_DEL) {
977                         /* Device is fully deleted, no commands
978                          * at all allowed down */
979                         printk(KERN_ERR "scsi%d (%d:%d): rejecting I/O to dead device\n",
980                                sdev->host->host_no, sdev->id, sdev->lun);
981                         return BLKPREP_KILL;
982                 }
983                 /* OK, we only allow special commands (i.e. not
984                  * user initiated ones */
985                 specials_only = sdev->sdev_state;
986         }
987
988         /*
989          * Find the actual device driver associated with this command.
990          * The SPECIAL requests are things like character device or
991          * ioctls, which did not originate from ll_rw_blk.  Note that
992          * the special field is also used to indicate the cmd for
993          * the remainder of a partially fulfilled request that can 
994          * come up when there is a medium error.  We have to treat
995          * these two cases differently.  We differentiate by looking
996          * at request->cmd, as this tells us the real story.
997          */
998         if (req->flags & REQ_SPECIAL) {
999                 struct scsi_request *sreq = req->special;
1000
1001                 if (sreq->sr_magic == SCSI_REQ_MAGIC) {
1002                         cmd = scsi_get_command(sreq->sr_device, GFP_ATOMIC);
1003                         if (unlikely(!cmd))
1004                                 goto defer;
1005                         scsi_init_cmd_from_req(cmd, sreq);
1006                 } else
1007                         cmd = req->special;
1008         } else if (req->flags & (REQ_CMD | REQ_BLOCK_PC)) {
1009
1010                 if(unlikely(specials_only)) {
1011                         if(specials_only == SDEV_QUIESCE)
1012                                 return BLKPREP_DEFER;
1013                         
1014                         printk(KERN_ERR "scsi%d (%d:%d): rejecting I/O to device being removed\n",
1015                                sdev->host->host_no, sdev->id, sdev->lun);
1016                         return BLKPREP_KILL;
1017                 }
1018                         
1019                         
1020                 /*
1021                  * Now try and find a command block that we can use.
1022                  */
1023                 if (!req->special) {
1024                         cmd = scsi_get_command(sdev, GFP_ATOMIC);
1025                         if (unlikely(!cmd))
1026                                 goto defer;
1027                 } else
1028                         cmd = req->special;
1029                 
1030                 /* pull a tag out of the request if we have one */
1031                 cmd->tag = req->tag;
1032         } else {
1033                 blk_dump_rq_flags(req, "SCSI bad req");
1034                 return BLKPREP_KILL;
1035         }
1036         
1037         /* note the overloading of req->special.  When the tag
1038          * is active it always means cmd.  If the tag goes
1039          * back for re-queueing, it may be reset */
1040         req->special = cmd;
1041         cmd->request = req;
1042         
1043         /*
1044          * FIXME: drop the lock here because the functions below
1045          * expect to be called without the queue lock held.  Also,
1046          * previously, we dequeued the request before dropping the
1047          * lock.  We hope REQ_STARTED prevents anything untoward from
1048          * happening now.
1049          */
1050         if (req->flags & (REQ_CMD | REQ_BLOCK_PC)) {
1051                 struct scsi_driver *drv;
1052                 int ret;
1053
1054                 /*
1055                  * This will do a couple of things:
1056                  *  1) Fill in the actual SCSI command.
1057                  *  2) Fill in any other upper-level specific fields
1058                  * (timeout).
1059                  *
1060                  * If this returns 0, it means that the request failed
1061                  * (reading past end of disk, reading offline device,
1062                  * etc).   This won't actually talk to the device, but
1063                  * some kinds of consistency checking may cause the     
1064                  * request to be rejected immediately.
1065                  */
1066
1067                 /* 
1068                  * This sets up the scatter-gather table (allocating if
1069                  * required).
1070                  */
1071                 ret = scsi_init_io(cmd);
1072                 if (ret)        /* BLKPREP_KILL return also releases the command */
1073                         return ret;
1074                 
1075                 /*
1076                  * Initialize the actual SCSI command for this request.
1077                  */
1078                 drv = *(struct scsi_driver **)req->rq_disk->private_data;
1079                 if (unlikely(!drv->init_command(cmd))) {
1080                         scsi_release_buffers(cmd);
1081                         scsi_put_command(cmd);
1082                         return BLKPREP_KILL;
1083                 }
1084         }
1085
1086         /*
1087          * The request is now prepped, no need to come back here
1088          */
1089         req->flags |= REQ_DONTPREP;
1090         return BLKPREP_OK;
1091
1092  defer:
1093         /* If we defer, the elv_next_request() returns NULL, but the
1094          * queue must be restarted, so we plug here if no returning
1095          * command will automatically do that. */
1096         if (sdev->device_busy == 0)
1097                 blk_plug_device(q);
1098         return BLKPREP_DEFER;
1099 }
1100
1101 /*
1102  * scsi_dev_queue_ready: if we can send requests to sdev, return 1 else
1103  * return 0.
1104  *
1105  * Called with the queue_lock held.
1106  */
1107 static inline int scsi_dev_queue_ready(struct request_queue *q,
1108                                   struct scsi_device *sdev)
1109 {
1110         if (sdev->device_busy >= sdev->queue_depth)
1111                 return 0;
1112         if (sdev->device_busy == 0 && sdev->device_blocked) {
1113                 /*
1114                  * unblock after device_blocked iterates to zero
1115                  */
1116                 if (--sdev->device_blocked == 0) {
1117                         SCSI_LOG_MLQUEUE(3,
1118                                 printk("scsi%d (%d:%d) unblocking device at"
1119                                        " zero depth\n", sdev->host->host_no,
1120                                        sdev->id, sdev->lun));
1121                 } else {
1122                         blk_plug_device(q);
1123                         return 0;
1124                 }
1125         }
1126         if (sdev->device_blocked)
1127                 return 0;
1128
1129         return 1;
1130 }
1131
1132 /*
1133  * scsi_host_queue_ready: if we can send requests to shost, return 1 else
1134  * return 0. We must end up running the queue again whenever 0 is
1135  * returned, else IO can hang.
1136  *
1137  * Called with host_lock held.
1138  */
1139 static inline int scsi_host_queue_ready(struct request_queue *q,
1140                                    struct Scsi_Host *shost,
1141                                    struct scsi_device *sdev)
1142 {
1143         if (test_bit(SHOST_RECOVERY, &shost->shost_state))
1144                 return 0;
1145         if (shost->host_busy == 0 && shost->host_blocked) {
1146                 /*
1147                  * unblock after host_blocked iterates to zero
1148                  */
1149                 if (--shost->host_blocked == 0) {
1150                         SCSI_LOG_MLQUEUE(3,
1151                                 printk("scsi%d unblocking host at zero depth\n",
1152                                         shost->host_no));
1153                 } else {
1154                         blk_plug_device(q);
1155                         return 0;
1156                 }
1157         }
1158         if ((shost->can_queue > 0 && shost->host_busy >= shost->can_queue) ||
1159             shost->host_blocked || shost->host_self_blocked) {
1160                 if (list_empty(&sdev->starved_entry))
1161                         list_add_tail(&sdev->starved_entry, &shost->starved_list);
1162                 return 0;
1163         }
1164
1165         /* We're OK to process the command, so we can't be starved */
1166         if (!list_empty(&sdev->starved_entry))
1167                 list_del_init(&sdev->starved_entry);
1168
1169         return 1;
1170 }
1171
1172 /*
1173  * Function:    scsi_request_fn()
1174  *
1175  * Purpose:     Main strategy routine for SCSI.
1176  *
1177  * Arguments:   q       - Pointer to actual queue.
1178  *
1179  * Returns:     Nothing
1180  *
1181  * Lock status: IO request lock assumed to be held when called.
1182  */
1183 static void scsi_request_fn(struct request_queue *q)
1184 {
1185         struct scsi_device *sdev = q->queuedata;
1186         struct Scsi_Host *shost = sdev->host;
1187         struct scsi_cmnd *cmd;
1188         struct request *req;
1189
1190         if(!get_device(&sdev->sdev_gendev))
1191                 /* We must be tearing the block queue down already */
1192                 return;
1193
1194         /*
1195          * To start with, we keep looping until the queue is empty, or until
1196          * the host is no longer able to accept any more requests.
1197          */
1198         while (!blk_queue_plugged(q)) {
1199                 int rtn;
1200                 /*
1201                  * get next queueable request.  We do this early to make sure
1202                  * that the request is fully prepared even if we cannot 
1203                  * accept it.
1204                  */
1205                 req = elv_next_request(q);
1206                 if (!req || !scsi_dev_queue_ready(q, sdev))
1207                         break;
1208
1209                 if (unlikely(!scsi_device_online(sdev))) {
1210                         printk(KERN_ERR "scsi%d (%d:%d): rejecting I/O to offline device\n",
1211                                sdev->host->host_no, sdev->id, sdev->lun);
1212                         blkdev_dequeue_request(req);
1213                         req->flags |= REQ_QUIET;
1214                         while (end_that_request_first(req, 0, req->nr_sectors))
1215                                 ;
1216                         end_that_request_last(req);
1217                         continue;
1218                 }
1219
1220
1221                 /*
1222                  * Remove the request from the request list.
1223                  */
1224                 if (!(blk_queue_tagged(q) && !blk_queue_start_tag(q, req)))
1225                         blkdev_dequeue_request(req);
1226                 sdev->device_busy++;
1227
1228                 spin_unlock(q->queue_lock);
1229                 spin_lock(shost->host_lock);
1230
1231                 if (!scsi_host_queue_ready(q, shost, sdev))
1232                         goto not_ready;
1233                 if (sdev->single_lun) {
1234                         if (sdev->sdev_target->starget_sdev_user &&
1235                             sdev->sdev_target->starget_sdev_user != sdev)
1236                                 goto not_ready;
1237                         sdev->sdev_target->starget_sdev_user = sdev;
1238                 }
1239                 shost->host_busy++;
1240
1241                 /*
1242                  * XXX(hch): This is rather suboptimal, scsi_dispatch_cmd will
1243                  *              take the lock again.
1244                  */
1245                 spin_unlock_irq(shost->host_lock);
1246
1247                 cmd = req->special;
1248                 if (unlikely(cmd == NULL)) {
1249                         printk(KERN_CRIT "impossible request in %s.\n"
1250                                          "please mail a stack trace to "
1251                                          "linux-scsi@vger.kernel.org",
1252                                          __FUNCTION__);
1253                         BUG();
1254                 }
1255
1256                 /*
1257                  * Finally, initialize any error handling parameters, and set up
1258                  * the timers for timeouts.
1259                  */
1260                 scsi_init_cmd_errh(cmd);
1261
1262                 /*
1263                  * Dispatch the command to the low-level driver.
1264                  */
1265                 rtn = scsi_dispatch_cmd(cmd);
1266                 spin_lock_irq(q->queue_lock);
1267                 if(rtn) {
1268                         /* we're refusing the command; because of
1269                          * the way locks get dropped, we need to 
1270                          * check here if plugging is required */
1271                         if(sdev->device_busy == 0)
1272                                 blk_plug_device(q);
1273
1274                         break;
1275                 }
1276         }
1277
1278         goto out;
1279
1280  not_ready:
1281         spin_unlock_irq(shost->host_lock);
1282
1283         /*
1284          * lock q, handle tag, requeue req, and decrement device_busy. We
1285          * must return with queue_lock held.
1286          *
1287          * Decrementing device_busy without checking it is OK, as all such
1288          * cases (host limits or settings) should run the queue at some
1289          * later time.
1290          */
1291         spin_lock_irq(q->queue_lock);
1292         blk_requeue_request(q, req);
1293         sdev->device_busy--;
1294         if(sdev->device_busy == 0)
1295                 blk_plug_device(q);
1296  out:
1297         /* must be careful here...if we trigger the ->remove() function
1298          * we cannot be holding the q lock */
1299         spin_unlock_irq(q->queue_lock);
1300         put_device(&sdev->sdev_gendev);
1301         spin_lock_irq(q->queue_lock);
1302 }
1303
1304 u64 scsi_calculate_bounce_limit(struct Scsi_Host *shost)
1305 {
1306         struct device *host_dev;
1307
1308         if (shost->unchecked_isa_dma)
1309                 return BLK_BOUNCE_ISA;
1310
1311         host_dev = scsi_get_device(shost);
1312         if (PCI_DMA_BUS_IS_PHYS && host_dev && host_dev->dma_mask)
1313                 return *host_dev->dma_mask;
1314
1315         /*
1316          * Platforms with virtual-DMA translation
1317          * hardware have no practical limit.
1318          */
1319         return BLK_BOUNCE_ANY;
1320 }
1321
1322 struct request_queue *scsi_alloc_queue(struct scsi_device *sdev)
1323 {
1324         struct Scsi_Host *shost = sdev->host;
1325         struct request_queue *q;
1326
1327         q = blk_init_queue(scsi_request_fn, &sdev->sdev_lock);
1328         if (!q)
1329                 return NULL;
1330
1331         blk_queue_prep_rq(q, scsi_prep_fn);
1332
1333         blk_queue_max_hw_segments(q, shost->sg_tablesize);
1334         blk_queue_max_phys_segments(q, SCSI_MAX_PHYS_SEGMENTS);
1335         blk_queue_max_sectors(q, shost->max_sectors);
1336         blk_queue_bounce_limit(q, scsi_calculate_bounce_limit(shost));
1337         blk_queue_segment_boundary(q, shost->dma_boundary);
1338  
1339         if (!shost->use_clustering)
1340                 clear_bit(QUEUE_FLAG_CLUSTER, &q->queue_flags);
1341         return q;
1342 }
1343
1344 void scsi_free_queue(struct request_queue *q)
1345 {
1346         blk_cleanup_queue(q);
1347 }
1348
1349 /*
1350  * Function:    scsi_block_requests()
1351  *
1352  * Purpose:     Utility function used by low-level drivers to prevent further
1353  *              commands from being queued to the device.
1354  *
1355  * Arguments:   shost       - Host in question
1356  *
1357  * Returns:     Nothing
1358  *
1359  * Lock status: No locks are assumed held.
1360  *
1361  * Notes:       There is no timer nor any other means by which the requests
1362  *              get unblocked other than the low-level driver calling
1363  *              scsi_unblock_requests().
1364  */
1365 void scsi_block_requests(struct Scsi_Host *shost)
1366 {
1367         shost->host_self_blocked = 1;
1368 }
1369
1370 /*
1371  * Function:    scsi_unblock_requests()
1372  *
1373  * Purpose:     Utility function used by low-level drivers to allow further
1374  *              commands from being queued to the device.
1375  *
1376  * Arguments:   shost       - Host in question
1377  *
1378  * Returns:     Nothing
1379  *
1380  * Lock status: No locks are assumed held.
1381  *
1382  * Notes:       There is no timer nor any other means by which the requests
1383  *              get unblocked other than the low-level driver calling
1384  *              scsi_unblock_requests().
1385  *
1386  *              This is done as an API function so that changes to the
1387  *              internals of the scsi mid-layer won't require wholesale
1388  *              changes to drivers that use this feature.
1389  */
1390 void scsi_unblock_requests(struct Scsi_Host *shost)
1391 {
1392         shost->host_self_blocked = 0;
1393         scsi_run_host_queues(shost);
1394 }
1395
1396 int __init scsi_init_queue(void)
1397 {
1398         int i;
1399
1400         for (i = 0; i < SG_MEMPOOL_NR; i++) {
1401                 struct scsi_host_sg_pool *sgp = scsi_sg_pools + i;
1402                 int size = sgp->size * sizeof(struct scatterlist);
1403
1404                 sgp->slab = kmem_cache_create(sgp->name, size, 0,
1405                                 SLAB_HWCACHE_ALIGN, NULL, NULL);
1406                 if (!sgp->slab) {
1407                         printk(KERN_ERR "SCSI: can't init sg slab %s\n",
1408                                         sgp->name);
1409                 }
1410
1411                 sgp->pool = mempool_create(SG_MEMPOOL_SIZE,
1412                                 mempool_alloc_slab, mempool_free_slab,
1413                                 sgp->slab);
1414                 if (!sgp->pool) {
1415                         printk(KERN_ERR "SCSI: can't init sg mempool %s\n",
1416                                         sgp->name);
1417                 }
1418         }
1419
1420         return 0;
1421 }
1422
1423 void scsi_exit_queue(void)
1424 {
1425         int i;
1426
1427         for (i = 0; i < SG_MEMPOOL_NR; i++) {
1428                 struct scsi_host_sg_pool *sgp = scsi_sg_pools + i;
1429                 mempool_destroy(sgp->pool);
1430                 kmem_cache_destroy(sgp->slab);
1431         }
1432 }
1433 /**
1434  *      __scsi_mode_sense - issue a mode sense, falling back from 10 to 
1435  *              six bytes if necessary.
1436  *      @sreq:  SCSI request to fill in with the MODE_SENSE
1437  *      @dbd:   set if mode sense will allow block descriptors to be returned
1438  *      @modepage: mode page being requested
1439  *      @buffer: request buffer (may not be smaller than eight bytes)
1440  *      @len:   length of request buffer.
1441  *      @timeout: command timeout
1442  *      @retries: number of retries before failing
1443  *      @data: returns a structure abstracting the mode header data
1444  *
1445  *      Returns zero if unsuccessful, or the header offset (either 4
1446  *      or 8 depending on whether a six or ten byte command was
1447  *      issued) if successful.
1448  **/
1449 int
1450 __scsi_mode_sense(struct scsi_request *sreq, int dbd, int modepage,
1451                   unsigned char *buffer, int len, int timeout, int retries,
1452                   struct scsi_mode_data *data) {
1453         unsigned char cmd[12];
1454         int use_10_for_ms;
1455         int header_length;
1456
1457         memset(data, 0, sizeof(*data));
1458         memset(&cmd[0], 0, 12);
1459         cmd[1] = dbd & 0x18;    /* allows DBD and LLBA bits */
1460         cmd[2] = modepage;
1461
1462  retry:
1463         use_10_for_ms = sreq->sr_device->use_10_for_ms;
1464
1465         if (use_10_for_ms) {
1466                 if (len < 8)
1467                         len = 8;
1468
1469                 cmd[0] = MODE_SENSE_10;
1470                 cmd[8] = len;
1471                 header_length = 8;
1472         } else {
1473                 if (len < 4)
1474                         len = 4;
1475
1476                 cmd[0] = MODE_SENSE;
1477                 cmd[4] = len;
1478                 header_length = 4;
1479         }
1480
1481         sreq->sr_cmd_len = 0;
1482         sreq->sr_sense_buffer[0] = 0;
1483         sreq->sr_sense_buffer[2] = 0;
1484         sreq->sr_data_direction = DMA_FROM_DEVICE;
1485
1486         memset(buffer, 0, len);
1487
1488         scsi_wait_req(sreq, cmd, buffer, len, timeout, retries);
1489
1490         /* This code looks awful: what it's doing is making sure an
1491          * ILLEGAL REQUEST sense return identifies the actual command
1492          * byte as the problem.  MODE_SENSE commands can return
1493          * ILLEGAL REQUEST if the code page isn't supported */
1494         if (use_10_for_ms && ! scsi_status_is_good(sreq->sr_result) &&
1495             (driver_byte(sreq->sr_result) & DRIVER_SENSE) &&
1496             sreq->sr_sense_buffer[2] == ILLEGAL_REQUEST &&
1497             (sreq->sr_sense_buffer[4] & 0x40) == 0x40 &&
1498             sreq->sr_sense_buffer[5] == 0 &&
1499             sreq->sr_sense_buffer[6] == 0 ) {
1500                 sreq->sr_device->use_10_for_ms = 0;
1501                 goto retry;
1502         }
1503
1504         if(scsi_status_is_good(sreq->sr_result)) {
1505                 data->header_length = header_length;
1506                 if(use_10_for_ms) {
1507                         data->length = buffer[0]*256 + buffer[1] + 2;
1508                         data->medium_type = buffer[2];
1509                         data->device_specific = buffer[3];
1510                         data->longlba = buffer[4] & 0x01;
1511                         data->block_descriptor_length = buffer[6]*256
1512                                 + buffer[7];
1513                 } else {
1514                         data->length = buffer[0] + 1;
1515                         data->medium_type = buffer[1];
1516                         data->device_specific = buffer[2];
1517                         data->block_descriptor_length = buffer[3];
1518                 }
1519         }
1520
1521         return sreq->sr_result;
1522 }
1523
1524 /**
1525  *      scsi_mode_sense - issue a mode sense, falling back from 10 to 
1526  *              six bytes if necessary.
1527  *      @sdev:  scsi device to send command to.
1528  *      @dbd:   set if mode sense will disable block descriptors in the return
1529  *      @modepage: mode page being requested
1530  *      @buffer: request buffer (may not be smaller than eight bytes)
1531  *      @len:   length of request buffer.
1532  *      @timeout: command timeout
1533  *      @retries: number of retries before failing
1534  *
1535  *      Returns zero if unsuccessful, or the header offset (either 4
1536  *      or 8 depending on whether a six or ten byte command was
1537  *      issued) if successful.
1538  **/
1539 int
1540 scsi_mode_sense(struct scsi_device *sdev, int dbd, int modepage,
1541                 unsigned char *buffer, int len, int timeout, int retries,
1542                 struct scsi_mode_data *data)
1543 {
1544         struct scsi_request *sreq = scsi_allocate_request(sdev, GFP_KERNEL);
1545         int ret;
1546
1547         if (!sreq)
1548                 return -1;
1549
1550         ret = __scsi_mode_sense(sreq, dbd, modepage, buffer, len,
1551                                 timeout, retries, data);
1552
1553         scsi_release_request(sreq);
1554
1555         return ret;
1556 }
1557
1558 /**
1559  *      scsi_device_set_state - Take the given device through the device
1560  *              state model.
1561  *      @sdev:  scsi device to change the state of.
1562  *      @state: state to change to.
1563  *
1564  *      Returns zero if unsuccessful or an error if the requested 
1565  *      transition is illegal.
1566  **/
1567 int
1568 scsi_device_set_state(struct scsi_device *sdev, enum scsi_device_state state)
1569 {
1570         enum scsi_device_state oldstate = sdev->sdev_state;
1571
1572         if (state == oldstate)
1573                 return 0;
1574
1575         switch (state) {
1576         case SDEV_CREATED:
1577                 /* There are no legal states that come back to
1578                  * created.  This is the manually initialised start
1579                  * state */
1580                 goto illegal;
1581                         
1582         case SDEV_RUNNING:
1583                 switch (oldstate) {
1584                 case SDEV_CREATED:
1585                 case SDEV_OFFLINE:
1586                 case SDEV_QUIESCE:
1587                         break;
1588                 default:
1589                         goto illegal;
1590                 }
1591                 break;
1592
1593         case SDEV_QUIESCE:
1594                 switch (oldstate) {
1595                 case SDEV_RUNNING:
1596                 case SDEV_OFFLINE:
1597                         break;
1598                 default:
1599                         goto illegal;
1600                 }
1601                 break;
1602
1603         case SDEV_OFFLINE:
1604                 switch (oldstate) {
1605                 case SDEV_CREATED:
1606                 case SDEV_RUNNING:
1607                 case SDEV_QUIESCE:
1608                         break;
1609                 default:
1610                         goto illegal;
1611                 }
1612                 break;
1613
1614         case SDEV_CANCEL:
1615                 switch (oldstate) {
1616                 case SDEV_CREATED:
1617                 case SDEV_RUNNING:
1618                 case SDEV_OFFLINE:
1619                         break;
1620                 default:
1621                         goto illegal;
1622                 }
1623                 break;
1624
1625         case SDEV_DEL:
1626                 switch (oldstate) {
1627                 case SDEV_CANCEL:
1628                         break;
1629                 default:
1630                         goto illegal;
1631                 }
1632                 break;
1633
1634         }
1635         sdev->sdev_state = state;
1636         return 0;
1637
1638  illegal:
1639         dev_printk(KERN_ERR, &sdev->sdev_gendev,
1640                    "Illegal state transition %s->%s\n",
1641                    scsi_device_state_name(oldstate),
1642                    scsi_device_state_name(state));
1643         WARN_ON(1);
1644         return -EINVAL;
1645 }
1646 EXPORT_SYMBOL(scsi_device_set_state);
1647
1648 /**
1649  *      scsi_device_quiesce - Block user issued commands.
1650  *      @sdev:  scsi device to quiesce.
1651  *
1652  *      This works by trying to transition to the SDEV_QUIESCE state
1653  *      (which must be a legal transition).  When the device is in this
1654  *      state, only special requests will be accepted, all others will
1655  *      be deferred.  Since special requests may also be requeued requests,
1656  *      a successful return doesn't guarantee the device will be 
1657  *      totally quiescent.
1658  *
1659  *      Must be called with user context, may sleep.
1660  *
1661  *      Returns zero if unsuccessful or an error if not.
1662  **/
1663 int
1664 scsi_device_quiesce(struct scsi_device *sdev)
1665 {
1666         int err = scsi_device_set_state(sdev, SDEV_QUIESCE);
1667         if (err)
1668                 return err;
1669
1670         scsi_run_queue(sdev->request_queue);
1671         while (sdev->device_busy) {
1672                 schedule_timeout(HZ/5);
1673                 scsi_run_queue(sdev->request_queue);
1674         }
1675         return 0;
1676 }
1677 EXPORT_SYMBOL(scsi_device_quiesce);
1678
1679 /**
1680  *      scsi_device_resume - Restart user issued commands to a quiesced device.
1681  *      @sdev:  scsi device to resume.
1682  *
1683  *      Moves the device from quiesced back to running and restarts the
1684  *      queues.
1685  *
1686  *      Must be called with user context, may sleep.
1687  **/
1688 void
1689 scsi_device_resume(struct scsi_device *sdev)
1690 {
1691         if(scsi_device_set_state(sdev, SDEV_RUNNING))
1692                 return;
1693         scsi_run_queue(sdev->request_queue);
1694 }
1695 EXPORT_SYMBOL(scsi_device_resume);
1696