drivers/scsi/scsi_lib.c

   1 /*
   2  *  scsi_lib.c Copyright (C) 1999 Eric Youngdale
   3  *
   4  *  SCSI queueing library.
   5  *      Initial versions: Eric Youngdale (eric@andante.org).
   6  *                        Based upon conversations with large numbers
   7  *                        of people at Linux Expo.
   8  */
   9
  10 #include <linux/bio.h>
  11 #include <linux/bitops.h>
  12 #include <linux/blkdev.h>
  13 #include <linux/completion.h>
  14 #include <linux/kernel.h>
  15 #include <linux/export.h>
  16 #include <linux/mempool.h>
  17 #include <linux/slab.h>
  18 #include <linux/init.h>
  19 #include <linux/pci.h>
  20 #include <linux/delay.h>
  21 #include <linux/hardirq.h>
  22 #include <linux/scatterlist.h>
  23
  24 #include <scsi/scsi.h>
  25 #include <scsi/scsi_cmnd.h>
  26 #include <scsi/scsi_dbg.h>
  27 #include <scsi/scsi_device.h>
  28 #include <scsi/scsi_driver.h>
  29 #include <scsi/scsi_eh.h>
  30 #include <scsi/scsi_host.h>
  31
  32 #include "scsi_priv.h"
  33 #include "scsi_logging.h"
  34
  35
  36 #define SG_MEMPOOL_NR           ARRAY_SIZE(scsi_sg_pools)
  37 #define SG_MEMPOOL_SIZE         2
  38
  39 struct scsi_host_sg_pool {
  40         size_t          size;
  41         char            *name;
  42         struct kmem_cache       *slab;
  43         mempool_t       *pool;
  44 };
  45
  46 #define SP(x) { x, "sgpool-" __stringify(x) }
  47 #if (SCSI_MAX_SG_SEGMENTS < 32)
  48 #error SCSI_MAX_SG_SEGMENTS is too small (must be 32 or greater)
  49 #endif
  50 static struct scsi_host_sg_pool scsi_sg_pools[] = {
  51         SP(8),
  52         SP(16),
  53 #if (SCSI_MAX_SG_SEGMENTS > 32)
  54         SP(32),
  55 #if (SCSI_MAX_SG_SEGMENTS > 64)
  56         SP(64),
  57 #if (SCSI_MAX_SG_SEGMENTS > 128)
  58         SP(128),
  59 #if (SCSI_MAX_SG_SEGMENTS > 256)
  60 #error SCSI_MAX_SG_SEGMENTS is too large (256 MAX)
  61 #endif
  62 #endif
  63 #endif
  64 #endif
  65         SP(SCSI_MAX_SG_SEGMENTS)
  66 };
  67 #undef SP
  68
/*
 * Slab cache for struct scsi_data_buffer objects; the extra data buffer of
 * a bidirectional command is returned to it in __scsi_release_buffers().
 */
struct kmem_cache *scsi_sdb_cache;

/*
 * When to reinvoke queueing after a resource shortage.  The value is
 * 3 msecs so that behaviour does not change from the previous unplug
 * mechanism; experimentation may prove this needs changing.
 */
#define SCSI_QUEUE_DELAY	3
  77
  78 /*
  79  * Function:    scsi_unprep_request()
  80  *
  81  * Purpose:     Remove all preparation done for a request, including its
  82  *              associated scsi_cmnd, so that it can be requeued.
  83  *
  84  * Arguments:   req     - request to unprepare
  85  *
  86  * Lock status: Assumed that no locks are held upon entry.
  87  *
  88  * Returns:     Nothing.
  89  */
  90 static void scsi_unprep_request(struct request *req)
  91 {
  92         struct scsi_cmnd *cmd = req->special;
  93
  94         blk_unprep_request(req);
  95         req->special = NULL;
  96
  97         scsi_put_command(cmd);
  98 }
  99
 100 /**
 101  * __scsi_queue_insert - private queue insertion
 102  * @cmd: The SCSI command being requeued
 103  * @reason:  The reason for the requeue
 104  * @unbusy: Whether the queue should be unbusied
 105  *
 106  * This is a private queue insertion.  The public interface
 107  * scsi_queue_insert() always assumes the queue should be unbusied
 108  * because it's always called before the completion.  This function is
 109  * for a requeue after completion, which should only occur in this
 110  * file.
 111  */
 112 static void __scsi_queue_insert(struct scsi_cmnd *cmd, int reason, int unbusy)
 113 {
 114         struct Scsi_Host *host = cmd->device->host;
 115         struct scsi_device *device = cmd->device;
 116         struct scsi_target *starget = scsi_target(device);
 117         struct request_queue *q = device->request_queue;
 118         unsigned long flags;
 119
 120         SCSI_LOG_MLQUEUE(1,
 121                  printk("Inserting command %p into mlqueue\n", cmd));
 122
 123         /*
 124          * Set the appropriate busy bit for the device/host.
 125          *
 126          * If the host/device isn't busy, assume that something actually
 127          * completed, and that we should be able to queue a command now.
 128          *
 129          * Note that the prior mid-layer assumption that any host could
 130          * always queue at least one command is now broken.  The mid-layer
 131          * will implement a user specifiable stall (see
 132          * scsi_host.max_host_blocked and scsi_device.max_device_blocked)
 133          * if a command is requeued with no other commands outstanding
 134          * either for the device or for the host.
 135          */
 136         switch (reason) {
 137         case SCSI_MLQUEUE_HOST_BUSY:
 138                 host->host_blocked = host->max_host_blocked;
 139                 break;
 140         case SCSI_MLQUEUE_DEVICE_BUSY:
 141         case SCSI_MLQUEUE_EH_RETRY:
 142                 device->device_blocked = device->max_device_blocked;
 143                 break;
 144         case SCSI_MLQUEUE_TARGET_BUSY:
 145                 starget->target_blocked = starget->max_target_blocked;
 146                 break;
 147         }
 148
 149         /*
 150          * Decrement the counters, since these commands are no longer
 151          * active on the host/device.
 152          */
 153         if (unbusy)
 154                 scsi_device_unbusy(device);
 155
 156         /*
 157          * Requeue this command.  It will go before all other commands
 158          * that are already in the queue. Schedule requeue work under
 159          * lock such that the kblockd_schedule_work() call happens
 160          * before blk_cleanup_queue() finishes.
 161          */
 162         spin_lock_irqsave(q->queue_lock, flags);
 163         blk_requeue_request(q, cmd->request);
 164         kblockd_schedule_work(q, &device->requeue_work);
 165         spin_unlock_irqrestore(q->queue_lock, flags);
 166 }
 167
 168 /*
 169  * Function:    scsi_queue_insert()
 170  *
 171  * Purpose:     Insert a command in the midlevel queue.
 172  *
 173  * Arguments:   cmd    - command that we are adding to queue.
 174  *              reason - why we are inserting command to queue.
 175  *
 176  * Lock status: Assumed that lock is not held upon entry.
 177  *
 178  * Returns:     Nothing.
 179  *
 180  * Notes:       We do this for one of two cases.  Either the host is busy
 181  *              and it cannot accept any more commands for the time being,
 182  *              or the device returned QUEUE_FULL and can accept no more
 183  *              commands.
 184  * Notes:       This could be called either from an interrupt context or a
 185  *              normal process context.
 186  */
 187 void scsi_queue_insert(struct scsi_cmnd *cmd, int reason)
 188 {
 189         __scsi_queue_insert(cmd, reason, 1);
 190 }
 191 /**
 192  * scsi_execute - insert request and wait for the result
 193  * @sdev:       scsi device
 194  * @cmd:        scsi command
 195  * @data_direction: data direction
 196  * @buffer:     data buffer
 197  * @bufflen:    len of buffer
 198  * @sense:      optional sense buffer
 199  * @timeout:    request timeout in seconds
 200  * @retries:    number of times to retry request
 201  * @flags:      or into request flags;
 202  * @resid:      optional residual length
 203  *
 204  * returns the req->errors value which is the scsi_cmnd result
 205  * field.
 206  */
 207 int scsi_execute(struct scsi_device *sdev, const unsigned char *cmd,
 208                  int data_direction, void *buffer, unsigned bufflen,
 209                  unsigned char *sense, int timeout, int retries, int flags,
 210                  int *resid)
 211 {
 212         struct request *req;
 213         int write = (data_direction == DMA_TO_DEVICE);
 214         int ret = DRIVER_ERROR << 24;
 215
 216         req = blk_get_request(sdev->request_queue, write, __GFP_WAIT);
 217         if (!req)
 218                 return ret;
 219
 220         if (bufflen &&  blk_rq_map_kern(sdev->request_queue, req,
 221                                         buffer, bufflen, __GFP_WAIT))
 222                 goto out;
 223
 224         req->cmd_len = COMMAND_SIZE(cmd[0]);
 225         memcpy(req->cmd, cmd, req->cmd_len);
 226         req->sense = sense;
 227         req->sense_len = 0;
 228         req->retries = retries;
 229         req->timeout = timeout;
 230         req->cmd_type = REQ_TYPE_BLOCK_PC;
 231         req->cmd_flags |= flags | REQ_QUIET | REQ_PREEMPT;
 232
 233         /*
 234          * head injection *required* here otherwise quiesce won't work
 235          */
 236         blk_execute_rq(req->q, NULL, req, 1);
 237
 238         /*
 239          * Some devices (USB mass-storage in particular) may transfer
 240          * garbage data together with a residue indicating that the data
 241          * is invalid.  Prevent the garbage from being misinterpreted
 242          * and prevent security leaks by zeroing out the excess data.
 243          */
 244         if (unlikely(req->resid_len > 0 && req->resid_len <= bufflen))
 245                 memset(buffer + (bufflen - req->resid_len), 0, req->resid_len);
 246
 247         if (resid)
 248                 *resid = req->resid_len;
 249         ret = req->errors;
 250  out:
 251         blk_put_request(req);
 252
 253         return ret;
 254 }
 255 EXPORT_SYMBOL(scsi_execute);
 256
 257 int scsi_execute_req_flags(struct scsi_device *sdev, const unsigned char *cmd,
 258                      int data_direction, void *buffer, unsigned bufflen,
 259                      struct scsi_sense_hdr *sshdr, int timeout, int retries,
 260                      int *resid, int flags)
 261 {
 262         char *sense = NULL;
 263         int result;
 264
 265         if (sshdr) {
 266                 sense = kzalloc(SCSI_SENSE_BUFFERSIZE, GFP_NOIO);
 267                 if (!sense)
 268                         return DRIVER_ERROR << 24;
 269         }
 270         result = scsi_execute(sdev, cmd, data_direction, buffer, bufflen,
 271                               sense, timeout, retries, flags, resid);
 272         if (sshdr)
 273                 scsi_normalize_sense(sense, SCSI_SENSE_BUFFERSIZE, sshdr);
 274
 275         kfree(sense);
 276         return result;
 277 }
 278 EXPORT_SYMBOL(scsi_execute_req_flags);
 279
 280 /*
 281  * Function:    scsi_init_cmd_errh()
 282  *
 283  * Purpose:     Initialize cmd fields related to error handling.
 284  *
 285  * Arguments:   cmd     - command that is ready to be queued.
 286  *
 287  * Notes:       This function has the job of initializing a number of
 288  *              fields related to error handling.   Typically this will
 289  *              be called once for each command, as required.
 290  */
 291 static void scsi_init_cmd_errh(struct scsi_cmnd *cmd)
 292 {
 293         cmd->serial_number = 0;
 294         scsi_set_resid(cmd, 0);
 295         memset(cmd->sense_buffer, 0, SCSI_SENSE_BUFFERSIZE);
 296         if (cmd->cmd_len == 0)
 297                 cmd->cmd_len = scsi_command_size(cmd->cmnd);
 298 }
 299
 300 void scsi_device_unbusy(struct scsi_device *sdev)
 301 {
 302         struct Scsi_Host *shost = sdev->host;
 303         struct scsi_target *starget = scsi_target(sdev);
 304         unsigned long flags;
 305
 306         spin_lock_irqsave(shost->host_lock, flags);
 307         shost->host_busy--;
 308         starget->target_busy--;
 309         if (unlikely(scsi_host_in_recovery(shost) &&
 310                      (shost->host_failed || shost->host_eh_scheduled)))
 311                 scsi_eh_wakeup(shost);
 312         spin_unlock(shost->host_lock);
 313         spin_lock(sdev->request_queue->queue_lock);
 314         sdev->device_busy--;
 315         spin_unlock_irqrestore(sdev->request_queue->queue_lock, flags);
 316 }
 317
 318 /*
 319  * Called for single_lun devices on IO completion. Clear starget_sdev_user,
 320  * and call blk_run_queue for all the scsi_devices on the target -
 321  * including current_sdev first.
 322  *
 323  * Called with *no* scsi locks held.
 324  */
 325 static void scsi_single_lun_run(struct scsi_device *current_sdev)
 326 {
 327         struct Scsi_Host *shost = current_sdev->host;
 328         struct scsi_device *sdev, *tmp;
 329         struct scsi_target *starget = scsi_target(current_sdev);
 330         unsigned long flags;
 331
 332         spin_lock_irqsave(shost->host_lock, flags);
 333         starget->starget_sdev_user = NULL;
 334         spin_unlock_irqrestore(shost->host_lock, flags);
 335
 336         /*
 337          * Call blk_run_queue for all LUNs on the target, starting with
 338          * current_sdev. We race with others (to set starget_sdev_user),
 339          * but in most cases, we will be first. Ideally, each LU on the
 340          * target would get some limited time or requests on the target.
 341          */
 342         blk_run_queue(current_sdev->request_queue);
 343
 344         spin_lock_irqsave(shost->host_lock, flags);
 345         if (starget->starget_sdev_user)
 346                 goto out;
 347         list_for_each_entry_safe(sdev, tmp, &starget->devices,
 348                         same_target_siblings) {
 349                 if (sdev == current_sdev)
 350                         continue;
 351                 if (scsi_device_get(sdev))
 352                         continue;
 353
 354                 spin_unlock_irqrestore(shost->host_lock, flags);
 355                 blk_run_queue(sdev->request_queue);
 356                 spin_lock_irqsave(shost->host_lock, flags);
 357
 358                 scsi_device_put(sdev);
 359         }
 360  out:
 361         spin_unlock_irqrestore(shost->host_lock, flags);
 362 }
 363
 364 static inline int scsi_device_is_busy(struct scsi_device *sdev)
 365 {
 366         if (sdev->device_busy >= sdev->queue_depth || sdev->device_blocked)
 367                 return 1;
 368
 369         return 0;
 370 }
 371
 372 static inline int scsi_target_is_busy(struct scsi_target *starget)
 373 {
 374         return ((starget->can_queue > 0 &&
 375                  starget->target_busy >= starget->can_queue) ||
 376                  starget->target_blocked);
 377 }
 378
 379 static inline int scsi_host_is_busy(struct Scsi_Host *shost)
 380 {
 381         if ((shost->can_queue > 0 && shost->host_busy >= shost->can_queue) ||
 382             shost->host_blocked || shost->host_self_blocked)
 383                 return 1;
 384
 385         return 0;
 386 }
 387
 388 /*
 389  * Function:    scsi_run_queue()
 390  *
 391  * Purpose:     Select a proper request queue to serve next
 392  *
 393  * Arguments:   q       - last request's queue
 394  *
 395  * Returns:     Nothing
 396  *
 397  * Notes:       The previous command was completely finished, start
 398  *              a new one if possible.
 399  */
 400 static void scsi_run_queue(struct request_queue *q)
 401 {
 402         struct scsi_device *sdev = q->queuedata;
 403         struct Scsi_Host *shost;
 404         LIST_HEAD(starved_list);
 405         unsigned long flags;
 406
 407         shost = sdev->host;
 408         if (scsi_target(sdev)->single_lun)
 409                 scsi_single_lun_run(sdev);
 410
 411         spin_lock_irqsave(shost->host_lock, flags);
 412         list_splice_init(&shost->starved_list, &starved_list);
 413
 414         while (!list_empty(&starved_list)) {
 415                 struct request_queue *slq;
 416
 417                 /*
 418                  * As long as shost is accepting commands and we have
 419                  * starved queues, call blk_run_queue. scsi_request_fn
 420                  * drops the queue_lock and can add us back to the
 421                  * starved_list.
 422                  *
 423                  * host_lock protects the starved_list and starved_entry.
 424                  * scsi_request_fn must get the host_lock before checking
 425                  * or modifying starved_list or starved_entry.
 426                  */
 427                 if (scsi_host_is_busy(shost))
 428                         break;
 429
 430                 sdev = list_entry(starved_list.next,
 431                                   struct scsi_device, starved_entry);
 432                 list_del_init(&sdev->starved_entry);
 433                 if (scsi_target_is_busy(scsi_target(sdev))) {
 434                         list_move_tail(&sdev->starved_entry,
 435                                        &shost->starved_list);
 436                         continue;
 437                 }
 438
 439                 /*
 440                  * Once we drop the host lock, a racing scsi_remove_device()
 441                  * call may remove the sdev from the starved list and destroy
 442                  * it and the queue.  Mitigate by taking a reference to the
 443                  * queue and never touching the sdev again after we drop the
 444                  * host lock.  Note: if __scsi_remove_device() invokes
 445                  * blk_cleanup_queue() before the queue is run from this
 446                  * function then blk_run_queue() will return immediately since
 447                  * blk_cleanup_queue() marks the queue with QUEUE_FLAG_DYING.
 448                  */
 449                 slq = sdev->request_queue;
 450                 if (!blk_get_queue(slq))
 451                         continue;
 452                 spin_unlock_irqrestore(shost->host_lock, flags);
 453
 454                 blk_run_queue(slq);
 455                 blk_put_queue(slq);
 456
 457                 spin_lock_irqsave(shost->host_lock, flags);
 458         }
 459         /* put any unprocessed entries back */
 460         list_splice(&starved_list, &shost->starved_list);
 461         spin_unlock_irqrestore(shost->host_lock, flags);
 462
 463         blk_run_queue(q);
 464 }
 465
 466 void scsi_requeue_run_queue(struct work_struct *work)
 467 {
 468         struct scsi_device *sdev;
 469         struct request_queue *q;
 470
 471         sdev = container_of(work, struct scsi_device, requeue_work);
 472         q = sdev->request_queue;
 473         scsi_run_queue(q);
 474 }
 475
 476 /*
 477  * Function:    scsi_requeue_command()
 478  *
 479  * Purpose:     Handle post-processing of completed commands.
 480  *
 481  * Arguments:   q       - queue to operate on
 482  *              cmd     - command that may need to be requeued.
 483  *
 484  * Returns:     Nothing
 485  *
 486  * Notes:       After command completion, there may be blocks left
 487  *              over which weren't finished by the previous command
 488  *              this can be for a number of reasons - the main one is
 489  *              I/O errors in the middle of the request, in which case
 490  *              we need to request the blocks that come after the bad
 491  *              sector.
 492  * Notes:       Upon return, cmd is a stale pointer.
 493  */
 494 static void scsi_requeue_command(struct request_queue *q, struct scsi_cmnd *cmd)
 495 {
 496         struct scsi_device *sdev = cmd->device;
 497         struct request *req = cmd->request;
 498         unsigned long flags;
 499
 500         /*
 501          * We need to hold a reference on the device to avoid the queue being
 502          * killed after the unlock and before scsi_run_queue is invoked which
 503          * may happen because scsi_unprep_request() puts the command which
 504          * releases its reference on the device.
 505          */
 506         get_device(&sdev->sdev_gendev);
 507
 508         spin_lock_irqsave(q->queue_lock, flags);
 509         scsi_unprep_request(req);
 510         blk_requeue_request(q, req);
 511         spin_unlock_irqrestore(q->queue_lock, flags);
 512
 513         scsi_run_queue(q);
 514
 515         put_device(&sdev->sdev_gendev);
 516 }
 517
 518 void scsi_next_command(struct scsi_cmnd *cmd)
 519 {
 520         struct scsi_device *sdev = cmd->device;
 521         struct request_queue *q = sdev->request_queue;
 522
 523         /* need to hold a reference on the device before we let go of the cmd */
 524         get_device(&sdev->sdev_gendev);
 525
 526         scsi_put_command(cmd);
 527         scsi_run_queue(q);
 528
 529         /* ok to remove device now */
 530         put_device(&sdev->sdev_gendev);
 531 }
 532
 533 void scsi_run_host_queues(struct Scsi_Host *shost)
 534 {
 535         struct scsi_device *sdev;
 536
 537         shost_for_each_device(sdev, shost)
 538                 scsi_run_queue(sdev->request_queue);
 539 }
 540
 541 static void __scsi_release_buffers(struct scsi_cmnd *, int);
 542
 543 /*
 544  * Function:    scsi_end_request()
 545  *
 546  * Purpose:     Post-processing of completed commands (usually invoked at end
 547  *              of upper level post-processing and scsi_io_completion).
 548  *
 549  * Arguments:   cmd      - command that is complete.
 550  *              error    - 0 if I/O indicates success, < 0 for I/O error.
 551  *              bytes    - number of bytes of completed I/O
 552  *              requeue  - indicates whether we should requeue leftovers.
 553  *
 554  * Lock status: Assumed that lock is not held upon entry.
 555  *
 556  * Returns:     cmd if requeue required, NULL otherwise.
 557  *
 558  * Notes:       This is called for block device requests in order to
 559  *              mark some number of sectors as complete.
 560  *
 561  *              We are guaranteeing that the request queue will be goosed
 562  *              at some point during this call.
 563  * Notes:       If cmd was requeued, upon return it will be a stale pointer.
 564  */
 565 static struct scsi_cmnd *scsi_end_request(struct scsi_cmnd *cmd, int error,
 566                                           int bytes, int requeue)
 567 {
 568         struct request_queue *q = cmd->device->request_queue;
 569         struct request *req = cmd->request;
 570
 571         /*
 572          * If there are blocks left over at the end, set up the command
 573          * to queue the remainder of them.
 574          */
 575         if (blk_end_request(req, error, bytes)) {
 576                 /* kill remainder if no retrys */
 577                 if (error && scsi_noretry_cmd(cmd))
 578                         blk_end_request_all(req, error);
 579                 else {
 580                         if (requeue) {
 581                                 /*
 582                                  * Bleah.  Leftovers again.  Stick the
 583                                  * leftovers in the front of the
 584                                  * queue, and goose the queue again.
 585                                  */
 586                                 scsi_release_buffers(cmd);
 587                                 scsi_requeue_command(q, cmd);
 588                                 cmd = NULL;
 589                         }
 590                         return cmd;
 591                 }
 592         }
 593
 594         /*
 595          * This will goose the queue request function at the end, so we don't
 596          * need to worry about launching another command.
 597          */
 598         __scsi_release_buffers(cmd, 0);
 599         scsi_next_command(cmd);
 600         return NULL;
 601 }
 602
 603 static inline unsigned int scsi_sgtable_index(unsigned short nents)
 604 {
 605         unsigned int index;
 606
 607         BUG_ON(nents > SCSI_MAX_SG_SEGMENTS);
 608
 609         if (nents <= 8)
 610                 index = 0;
 611         else
 612                 index = get_count_order(nents) - 3;
 613
 614         return index;
 615 }
 616
 617 static void scsi_sg_free(struct scatterlist *sgl, unsigned int nents)
 618 {
 619         struct scsi_host_sg_pool *sgp;
 620
 621         sgp = scsi_sg_pools + scsi_sgtable_index(nents);
 622         mempool_free(sgl, sgp->pool);
 623 }
 624
 625 static struct scatterlist *scsi_sg_alloc(unsigned int nents, gfp_t gfp_mask)
 626 {
 627         struct scsi_host_sg_pool *sgp;
 628
 629         sgp = scsi_sg_pools + scsi_sgtable_index(nents);
 630         return mempool_alloc(sgp->pool, gfp_mask);
 631 }
 632
 633 static int scsi_alloc_sgtable(struct scsi_data_buffer *sdb, int nents,
 634                               gfp_t gfp_mask)
 635 {
 636         int ret;
 637
 638         BUG_ON(!nents);
 639
 640         ret = __sg_alloc_table(&sdb->table, nents, SCSI_MAX_SG_SEGMENTS,
 641                                gfp_mask, scsi_sg_alloc);
 642         if (unlikely(ret))
 643                 __sg_free_table(&sdb->table, SCSI_MAX_SG_SEGMENTS,
 644                                 scsi_sg_free);
 645
 646         return ret;
 647 }
 648
 649 static void scsi_free_sgtable(struct scsi_data_buffer *sdb)
 650 {
 651         __sg_free_table(&sdb->table, SCSI_MAX_SG_SEGMENTS, scsi_sg_free);
 652 }
 653
 654 static void __scsi_release_buffers(struct scsi_cmnd *cmd, int do_bidi_check)
 655 {
 656
 657         if (cmd->sdb.table.nents)
 658                 scsi_free_sgtable(&cmd->sdb);
 659
 660         memset(&cmd->sdb, 0, sizeof(cmd->sdb));
 661
 662         if (do_bidi_check && scsi_bidi_cmnd(cmd)) {
 663                 struct scsi_data_buffer *bidi_sdb =
 664                         cmd->request->next_rq->special;
 665                 scsi_free_sgtable(bidi_sdb);
 666                 kmem_cache_free(scsi_sdb_cache, bidi_sdb);
 667                 cmd->request->next_rq->special = NULL;
 668         }
 669
 670         if (scsi_prot_sg_count(cmd))
 671                 scsi_free_sgtable(cmd->prot_sdb);
 672 }
 673
 674 /*
 675  * Function:    scsi_release_buffers()
 676  *
 677  * Purpose:     Completion processing for block device I/O requests.
 678  *
 679  * Arguments:   cmd     - command that we are bailing.
 680  *
 681  * Lock status: Assumed that no lock is held upon entry.
 682  *
 683  * Returns:     Nothing
 684  *
 685  * Notes:       In the event that an upper level driver rejects a
 686  *              command, we must release resources allocated during
 687  *              the __init_io() function.  Primarily this would involve
 688  *              the scatter-gather table, and potentially any bounce
 689  *              buffers.
 690  */
 691 void scsi_release_buffers(struct scsi_cmnd *cmd)
 692 {
 693         __scsi_release_buffers(cmd, 1);
 694 }
 695 EXPORT_SYMBOL(scsi_release_buffers);
 696
 697 /**
 698  * __scsi_error_from_host_byte - translate SCSI error code into errno
 699  * @cmd:        SCSI command (unused)
 700  * @result:     scsi error code
 701  *
 702  * Translate SCSI error code into standard UNIX errno.
 703  * Return values:
 704  * -ENOLINK     temporary transport failure
 705  * -EREMOTEIO   permanent target failure, do not retry
 706  * -EBADE       permanent nexus failure, retry on other path
 707  * -ENOSPC      No write space available
 708  * -ENODATA     Medium error
 709  * -EIO         unspecified I/O error
 710  */
 711 static int __scsi_error_from_host_byte(struct scsi_cmnd *cmd, int result)
 712 {
 713         int error = 0;
 714
 715         switch(host_byte(result)) {
 716         case DID_TRANSPORT_FAILFAST:
 717                 error = -ENOLINK;
 718                 break;
 719         case DID_TARGET_FAILURE:
 720                 set_host_byte(cmd, DID_OK);
 721                 error = -EREMOTEIO;
 722                 break;
 723         case DID_NEXUS_FAILURE:
 724                 set_host_byte(cmd, DID_OK);
 725                 error = -EBADE;
 726                 break;
 727         case DID_ALLOC_FAILURE:
 728                 set_host_byte(cmd, DID_OK);
 729                 error = -ENOSPC;
 730                 break;
 731         case DID_MEDIUM_ERROR:
 732                 set_host_byte(cmd, DID_OK);
 733                 error = -ENODATA;
 734                 break;
 735         default:
 736                 error = -EIO;
 737                 break;
 738         }
 739
 740         return error;
 741 }
 742
 743 /*
 744  * Function:    scsi_io_completion()
 745  *
 746  * Purpose:     Completion processing for block device I/O requests.
 747  *
 748  * Arguments:   cmd   - command that is finished.
 749  *
 750  * Lock status: Assumed that no lock is held upon entry.
 751  *
 752  * Returns:     Nothing
 753  *
 754  * Notes:       This function is matched in terms of capabilities to
 755  *              the function that created the scatter-gather list.
 756  *              In other words, if there are no bounce buffers
 757  *              (the normal case for most drivers), we don't need
 758  *              the logic to deal with cleaning up afterwards.
 759  *
 760  *              We must call scsi_end_request().  This will finish off
 761  *              the specified number of sectors.  If we are done, the
 762  *              command block will be released and the queue function
 763  *              will be goosed.  If we are not done then we have to
 764  *              figure out what to do next:
 765  *
 766  *              a) We can call scsi_requeue_command().  The request
 767  *                 will be unprepared and put back on the queue.  Then
 768  *                 a new command will be created for it.  This should
 769  *                 be used if we made forward progress, or if we want
 770  *                 to switch from READ(10) to READ(6) for example.
 771  *
 772  *              b) We can call scsi_queue_insert().  The request will
 773  *                 be put back on the queue and retried using the same
 774  *                 command as before, possibly after a delay.
 775  *
 776  *              c) We can call blk_end_request() with -EIO to fail
 777  *                 the remainder of the request.
 778  */
 779 void scsi_io_completion(struct scsi_cmnd *cmd, unsigned int good_bytes)
 780 {
 781         int result = cmd->result;
 782         struct request_queue *q = cmd->device->request_queue;
 783         struct request *req = cmd->request;
 784         int error = 0;
 785         struct scsi_sense_hdr sshdr;
 786         int sense_valid = 0;
 787         int sense_deferred = 0;
 788         enum {ACTION_FAIL, ACTION_REPREP, ACTION_RETRY,
 789               ACTION_DELAYED_RETRY} action;
 790         char *description = NULL;
 791
 792         if (result) {
 793                 sense_valid = scsi_command_normalize_sense(cmd, &sshdr);
 794                 if (sense_valid)
 795                         sense_deferred = scsi_sense_is_deferred(&sshdr);
 796         }
 797
 798         if (req->cmd_type == REQ_TYPE_BLOCK_PC) { /* SG_IO ioctl from block level */
 799                 if (result) {
 800                         if (sense_valid && req->sense) {
 801                                 /*
 802                                  * SG_IO wants current and deferred errors
 803                                  */
 804                                 int len = 8 + cmd->sense_buffer[7];
 805
 806                                 if (len > SCSI_SENSE_BUFFERSIZE)
 807                                         len = SCSI_SENSE_BUFFERSIZE;
 808                                 memcpy(req->sense, cmd->sense_buffer,  len);
 809                                 req->sense_len = len;
 810                         }
 811                         if (!sense_deferred)
 812                                 error = __scsi_error_from_host_byte(cmd, result);
 813                 }
 814                 /*
 815                  * __scsi_error_from_host_byte may have reset the host_byte
 816                  */
 817                 req->errors = cmd->result;
 818
 819                 req->resid_len = scsi_get_resid(cmd);
 820
 821                 if (scsi_bidi_cmnd(cmd)) {
 822                         /*
 823                          * Bidi commands Must be complete as a whole,
 824                          * both sides at once.
 825                          */
 826                         req->next_rq->resid_len = scsi_in(cmd)->resid;
 827
 828                         scsi_release_buffers(cmd);
 829                         blk_end_request_all(req, 0);
 830
 831                         scsi_next_command(cmd);
 832                         return;
 833                 }
 834         } else if (blk_rq_bytes(req) == 0 && result && !sense_deferred) {
 835                 /*
 836                  * Certain non BLOCK_PC requests are commands that don't
 837                  * actually transfer anything (FLUSH), so cannot use
 838                  * good_bytes != blk_rq_bytes(req) as the signal for an error.
 839                  * This sets the error explicitly for the problem case.
 840                  */
 841                 error = __scsi_error_from_host_byte(cmd, result);
 842         }
 843
 844         /* no bidi support for !REQ_TYPE_BLOCK_PC yet */
 845         BUG_ON(blk_bidi_rq(req));
 846
 847         /*
 848          * Next deal with any sectors which we were able to correctly
 849          * handle.
 850          */
 851         SCSI_LOG_HLCOMPLETE(1, printk("%u sectors total, "
 852                                       "%d bytes done.\n",
 853                                       blk_rq_sectors(req), good_bytes));
 854
 855         /*
 856          * Recovered errors need reporting, but they're always treated
 857          * as success, so fiddle the result code here.  For BLOCK_PC
 858          * we already took a copy of the original into rq->errors which
 859          * is what gets returned to the user
 860          */
 861         if (sense_valid && (sshdr.sense_key == RECOVERED_ERROR)) {
 862                 /* if ATA PASS-THROUGH INFORMATION AVAILABLE skip
 863                  * print since caller wants ATA registers. Only occurs on
 864                  * SCSI ATA PASS_THROUGH commands when CK_COND=1
 865                  */
 866                 if ((sshdr.asc == 0x0) && (sshdr.ascq == 0x1d))
 867                         ;
 868                 else if (!(req->cmd_flags & REQ_QUIET))
 869                         scsi_print_sense("", cmd);
 870                 result = 0;
 871                 /* BLOCK_PC may have set error */
 872                 error = 0;
 873         }
 874
 875         /*
 876          * A number of bytes were successfully read.  If there
 877          * are leftovers and there is some kind of error
 878          * (result != 0), retry the rest.
 879          */
 880         if (scsi_end_request(cmd, error, good_bytes, result == 0) == NULL)
 881                 return;
 882
 883         error = __scsi_error_from_host_byte(cmd, result);
 884
 885         if (host_byte(result) == DID_RESET) {
 886                 /* Third party bus reset or reset for error recovery
 887                  * reasons.  Just retry the command and see what
 888                  * happens.
 889                  */
 890                 action = ACTION_RETRY;
 891         } else if (sense_valid && !sense_deferred) {
 892                 switch (sshdr.sense_key) {
 893                 case UNIT_ATTENTION:
 894                         if (cmd->device->removable) {
 895                                 /* Detected disc change.  Set a bit
 896                                  * and quietly refuse further access.
 897                                  */
 898                                 cmd->device->changed = 1;
 899                                 description = "Media Changed";
 900                                 action = ACTION_FAIL;
 901                         } else {
 902                                 /* Must have been a power glitch, or a
 903                                  * bus reset.  Could not have been a
 904                                  * media change, so we just retry the
 905                                  * command and see what happens.
 906                                  */
 907                                 action = ACTION_RETRY;
 908                         }
 909                         break;
 910                 case ILLEGAL_REQUEST:
 911                         /* If we had an ILLEGAL REQUEST returned, then
 912                          * we may have performed an unsupported
 913                          * command.  The only thing this should be
 914                          * would be a ten byte read where only a six
 915                          * byte read was supported.  Also, on a system
 916                          * where READ CAPACITY failed, we may have
 917                          * read past the end of the disk.
 918                          */
 919                         if ((cmd->device->use_10_for_rw &&
 920                             sshdr.asc == 0x20 && sshdr.ascq == 0x00) &&
 921                             (cmd->cmnd[0] == READ_10 ||
 922                              cmd->cmnd[0] == WRITE_10)) {
 923                                 /* This will issue a new 6-byte command. */
 924                                 cmd->device->use_10_for_rw = 0;
 925                                 action = ACTION_REPREP;
 926                         } else if (sshdr.asc == 0x10) /* DIX */ {
 927                                 description = "Host Data Integrity Failure";
 928                                 action = ACTION_FAIL;
 929                                 error = -EILSEQ;
 930                         /* INVALID COMMAND OPCODE or INVALID FIELD IN CDB */
 931                         } else if (sshdr.asc == 0x20 || sshdr.asc == 0x24) {
 932                                 switch (cmd->cmnd[0]) {
 933                                 case UNMAP:
 934                                         description = "Discard failure";
 935                                         break;
 936                                 case WRITE_SAME:
 937                                 case WRITE_SAME_16:
 938                                         if (cmd->cmnd[1] & 0x8)
 939                                                 description = "Discard failure";
 940                                         else
 941                                                 description =
 942                                                         "Write same failure";
 943                                         break;
 944                                 default:
 945                                         description = "Invalid command failure";
 946                                         break;
 947                                 }
 948                                 action = ACTION_FAIL;
 949                                 error = -EREMOTEIO;
 950                         } else
 951                                 action = ACTION_FAIL;
 952                         break;
 953                 case ABORTED_COMMAND:
 954                         action = ACTION_FAIL;
 955                         if (sshdr.asc == 0x10) { /* DIF */
 956                                 description = "Target Data Integrity Failure";
 957                                 error = -EILSEQ;
 958                         }
 959                         break;
 960                 case NOT_READY:
 961                         /* If the device is in the process of becoming
 962                          * ready, or has a temporary blockage, retry.
 963                          */
 964                         if (sshdr.asc == 0x04) {
 965                                 switch (sshdr.ascq) {
 966                                 case 0x01: /* becoming ready */
 967                                 case 0x04: /* format in progress */
 968                                 case 0x05: /* rebuild in progress */
 969                                 case 0x06: /* recalculation in progress */
 970                                 case 0x07: /* operation in progress */
 971                                 case 0x08: /* Long write in progress */
 972                                 case 0x09: /* self test in progress */
 973                                 case 0x14: /* space allocation in progress */
 974                                         action = ACTION_DELAYED_RETRY;
 975                                         break;
 976                                 default:
 977                                         description = "Device not ready";
 978                                         action = ACTION_FAIL;
 979                                         break;
 980                                 }
 981                         } else {
 982                                 description = "Device not ready";
 983                                 action = ACTION_FAIL;
 984                         }
 985                         break;
 986                 case VOLUME_OVERFLOW:
 987                         /* See SSC3rXX or current. */
 988                         action = ACTION_FAIL;
 989                         break;
 990                 default:
 991                         description = "Unhandled sense code";
 992                         action = ACTION_FAIL;
 993                         break;
 994                 }
 995         } else {
 996                 description = "Unhandled error code";
 997                 action = ACTION_FAIL;
 998         }
 999
1000         switch (action) {
1001         case ACTION_FAIL:
1002                 /* Give up and fail the remainder of the request */
1003                 scsi_release_buffers(cmd);
1004                 if (!(req->cmd_flags & REQ_QUIET)) {
1005                         if (description)
1006                                 scmd_printk(KERN_INFO, cmd, "%s\n",
1007                                             description);
1008                         scsi_print_result(cmd);
1009                         if (driver_byte(result) & DRIVER_SENSE)
1010                                 scsi_print_sense("", cmd);
1011                         scsi_print_command(cmd);
1012                 }
1013                 if (blk_end_request_err(req, error))
1014                         scsi_requeue_command(q, cmd);
1015                 else
1016                         scsi_next_command(cmd);
1017                 break;
1018         case ACTION_REPREP:
1019                 /* Unprep the request and put it back at the head of the queue.
1020                  * A new command will be prepared and issued.
1021                  */
1022                 scsi_release_buffers(cmd);
1023                 scsi_requeue_command(q, cmd);
1024                 break;
1025         case ACTION_RETRY:
1026                 /* Retry the same command immediately */
1027                 __scsi_queue_insert(cmd, SCSI_MLQUEUE_EH_RETRY, 0);
1028                 break;
1029         case ACTION_DELAYED_RETRY:
1030                 /* Retry the same command after a delay */
1031                 __scsi_queue_insert(cmd, SCSI_MLQUEUE_DEVICE_BUSY, 0);
1032                 break;
1033         }
1034 }
1035
1036 static int scsi_init_sgtable(struct request *req, struct scsi_data_buffer *sdb,
1037                              gfp_t gfp_mask)
1038 {
1039         int count;
1040
1041         /*
1042          * If sg table allocation fails, requeue request later.
1043          */
1044         if (unlikely(scsi_alloc_sgtable(sdb, req->nr_phys_segments,
1045                                         gfp_mask))) {
1046                 return BLKPREP_DEFER;
1047         }
1048
1049         req->buffer = NULL;
1050
1051         /*
1052          * Next, walk the list, and fill in the addresses and sizes of
1053          * each segment.
1054          */
1055         count = blk_rq_map_sg(req->q, req, sdb->table.sgl);
1056         BUG_ON(count > sdb->table.nents);
1057         sdb->table.nents = count;
1058         sdb->length = blk_rq_bytes(req);
1059         return BLKPREP_OK;
1060 }
1061
1062 /*
1063  * Function:    scsi_init_io()
1064  *
1065  * Purpose:     SCSI I/O initialize function.
1066  *
1067  * Arguments:   cmd   - Command descriptor we wish to initialize
1068  *
1069  * Returns:     0 on success
1070  *              BLKPREP_DEFER if the failure is retryable
1071  *              BLKPREP_KILL if the failure is fatal
1072  */
1073 int scsi_init_io(struct scsi_cmnd *cmd, gfp_t gfp_mask)
1074 {
1075         struct request *rq = cmd->request;
1076
1077         int error = scsi_init_sgtable(rq, &cmd->sdb, gfp_mask);
1078         if (error)
1079                 goto err_exit;
1080
1081         if (blk_bidi_rq(rq)) {
1082                 struct scsi_data_buffer *bidi_sdb = kmem_cache_zalloc(
1083                         scsi_sdb_cache, GFP_ATOMIC);
1084                 if (!bidi_sdb) {
1085                         error = BLKPREP_DEFER;
1086                         goto err_exit;
1087                 }
1088
1089                 rq->next_rq->special = bidi_sdb;
1090                 error = scsi_init_sgtable(rq->next_rq, bidi_sdb, GFP_ATOMIC);
1091                 if (error)
1092                         goto err_exit;
1093         }
1094
1095         if (blk_integrity_rq(rq)) {
1096                 struct scsi_data_buffer *prot_sdb = cmd->prot_sdb;
1097                 int ivecs, count;
1098
1099                 BUG_ON(prot_sdb == NULL);
1100                 ivecs = blk_rq_count_integrity_sg(rq->q, rq->bio);
1101
1102                 if (scsi_alloc_sgtable(prot_sdb, ivecs, gfp_mask)) {
1103                         error = BLKPREP_DEFER;
1104                         goto err_exit;
1105                 }
1106
1107                 count = blk_rq_map_integrity_sg(rq->q, rq->bio,
1108                                                 prot_sdb->table.sgl);
1109                 BUG_ON(unlikely(count > ivecs));
1110                 BUG_ON(unlikely(count > queue_max_integrity_segments(rq->q)));
1111
1112                 cmd->prot_sdb = prot_sdb;
1113                 cmd->prot_sdb->table.nents = count;
1114         }
1115
1116         return BLKPREP_OK ;
1117
1118 err_exit:
1119         scsi_release_buffers(cmd);
1120         cmd->request->special = NULL;
1121         scsi_put_command(cmd);
1122         return error;
1123 }
1124 EXPORT_SYMBOL(scsi_init_io);
1125
1126 static struct scsi_cmnd *scsi_get_cmd_from_req(struct scsi_device *sdev,
1127                 struct request *req)
1128 {
1129         struct scsi_cmnd *cmd;
1130
1131         if (!req->special) {
1132                 cmd = scsi_get_command(sdev, GFP_ATOMIC);
1133                 if (unlikely(!cmd))
1134                         return NULL;
1135                 req->special = cmd;
1136         } else {
1137                 cmd = req->special;
1138         }
1139
1140         /* pull a tag out of the request if we have one */
1141         cmd->tag = req->tag;
1142         cmd->request = req;
1143
1144         cmd->cmnd = req->cmd;
1145         cmd->prot_op = SCSI_PROT_NORMAL;
1146
1147         return cmd;
1148 }
1149
1150 int scsi_setup_blk_pc_cmnd(struct scsi_device *sdev, struct request *req)
1151 {
1152         struct scsi_cmnd *cmd;
1153         int ret = scsi_prep_state_check(sdev, req);
1154
1155         if (ret != BLKPREP_OK)
1156                 return ret;
1157
1158         cmd = scsi_get_cmd_from_req(sdev, req);
1159         if (unlikely(!cmd))
1160                 return BLKPREP_DEFER;
1161
1162         /*
1163          * BLOCK_PC requests may transfer data, in which case they must
1164          * a bio attached to them.  Or they might contain a SCSI command
1165          * that does not transfer data, in which case they may optionally
1166          * submit a request without an attached bio.
1167          */
1168         if (req->bio) {
1169                 int ret;
1170
1171                 BUG_ON(!req->nr_phys_segments);
1172
1173                 ret = scsi_init_io(cmd, GFP_ATOMIC);
1174                 if (unlikely(ret))
1175                         return ret;
1176         } else {
1177                 BUG_ON(blk_rq_bytes(req));
1178
1179                 memset(&cmd->sdb, 0, sizeof(cmd->sdb));
1180                 req->buffer = NULL;
1181         }
1182
1183         cmd->cmd_len = req->cmd_len;
1184         if (!blk_rq_bytes(req))
1185                 cmd->sc_data_direction = DMA_NONE;
1186         else if (rq_data_dir(req) == WRITE)
1187                 cmd->sc_data_direction = DMA_TO_DEVICE;
1188         else
1189                 cmd->sc_data_direction = DMA_FROM_DEVICE;
1190
1191         cmd->transfersize = blk_rq_bytes(req);
1192         cmd->allowed = req->retries;
1193         return BLKPREP_OK;
1194 }
1195 EXPORT_SYMBOL(scsi_setup_blk_pc_cmnd);
1196
1197 /*
1198  * Setup a REQ_TYPE_FS command.  These are simple read/write request
1199  * from filesystems that still need to be translated to SCSI CDBs from
1200  * the ULD.
1201  */
1202 int scsi_setup_fs_cmnd(struct scsi_device *sdev, struct request *req)
1203 {
1204         struct scsi_cmnd *cmd;
1205         int ret = scsi_prep_state_check(sdev, req);
1206
1207         if (ret != BLKPREP_OK)
1208                 return ret;
1209
1210         if (unlikely(sdev->scsi_dh_data && sdev->scsi_dh_data->scsi_dh
1211                          && sdev->scsi_dh_data->scsi_dh->prep_fn)) {
1212                 ret = sdev->scsi_dh_data->scsi_dh->prep_fn(sdev, req);
1213                 if (ret != BLKPREP_OK)
1214                         return ret;
1215         }
1216
1217         /*
1218          * Filesystem requests must transfer data.
1219          */
1220         BUG_ON(!req->nr_phys_segments);
1221
1222         cmd = scsi_get_cmd_from_req(sdev, req);
1223         if (unlikely(!cmd))
1224                 return BLKPREP_DEFER;
1225
1226         memset(cmd->cmnd, 0, BLK_MAX_CDB);
1227         return scsi_init_io(cmd, GFP_ATOMIC);
1228 }
1229 EXPORT_SYMBOL(scsi_setup_fs_cmnd);
1230
1231 int scsi_prep_state_check(struct scsi_device *sdev, struct request *req)
1232 {
1233         int ret = BLKPREP_OK;
1234
1235         /*
1236          * If the device is not in running state we will reject some
1237          * or all commands.
1238          */
1239         if (unlikely(sdev->sdev_state != SDEV_RUNNING)) {
1240                 switch (sdev->sdev_state) {
1241                 case SDEV_OFFLINE:
1242                 case SDEV_TRANSPORT_OFFLINE:
1243                         /*
1244                          * If the device is offline we refuse to process any
1245                          * commands.  The device must be brought online
1246                          * before trying any recovery commands.
1247                          */
1248                         sdev_printk(KERN_ERR, sdev,
1249                                     "rejecting I/O to offline device\n");
1250                         ret = BLKPREP_KILL;
1251                         break;
1252                 case SDEV_DEL:
1253                         /*
1254                          * If the device is fully deleted, we refuse to
1255                          * process any commands as well.
1256                          */
1257                         sdev_printk(KERN_ERR, sdev,
1258                                     "rejecting I/O to dead device\n");
1259                         ret = BLKPREP_KILL;
1260                         break;
1261                 case SDEV_BLOCK:
1262                 case SDEV_CREATED_BLOCK:
1263                         ret = BLKPREP_DEFER;
1264                         break;
1265                 case SDEV_QUIESCE:
1266                         /*
1267                          * If the devices is blocked we defer normal commands.
1268                          */
1269                         if (!(req->cmd_flags & REQ_PREEMPT))
1270                                 ret = BLKPREP_DEFER;
1271                         break;
1272                 default:
1273                         /*
1274                          * For any other not fully online state we only allow
1275                          * special commands.  In particular any user initiated
1276                          * command is not allowed.
1277                          */
1278                         if (!(req->cmd_flags & REQ_PREEMPT))
1279                                 ret = BLKPREP_KILL;
1280                         break;
1281                 }
1282         }
1283         return ret;
1284 }
1285 EXPORT_SYMBOL(scsi_prep_state_check);
1286
1287 int scsi_prep_return(struct request_queue *q, struct request *req, int ret)
1288 {
1289         struct scsi_device *sdev = q->queuedata;
1290
1291         switch (ret) {
1292         case BLKPREP_KILL:
1293                 req->errors = DID_NO_CONNECT << 16;
1294                 /* release the command and kill it */
1295                 if (req->special) {
1296                         struct scsi_cmnd *cmd = req->special;
1297                         scsi_release_buffers(cmd);
1298                         scsi_put_command(cmd);
1299                         req->special = NULL;
1300                 }
1301                 break;
1302         case BLKPREP_DEFER:
1303                 /*
1304                  * If we defer, the blk_peek_request() returns NULL, but the
1305                  * queue must be restarted, so we schedule a callback to happen
1306                  * shortly.
1307                  */
1308                 if (sdev->device_busy == 0)
1309                         blk_delay_queue(q, SCSI_QUEUE_DELAY);
1310                 break;
1311         default:
1312                 req->cmd_flags |= REQ_DONTPREP;
1313         }
1314
1315         return ret;
1316 }
1317 EXPORT_SYMBOL(scsi_prep_return);
1318
1319 int scsi_prep_fn(struct request_queue *q, struct request *req)
1320 {
1321         struct scsi_device *sdev = q->queuedata;
1322         int ret = BLKPREP_KILL;
1323
1324         if (req->cmd_type == REQ_TYPE_BLOCK_PC)
1325                 ret = scsi_setup_blk_pc_cmnd(sdev, req);
1326         return scsi_prep_return(q, req, ret);
1327 }
1328 EXPORT_SYMBOL(scsi_prep_fn);
1329
1330 /*
1331  * scsi_dev_queue_ready: if we can send requests to sdev, return 1 else
1332  * return 0.
1333  *
1334  * Called with the queue_lock held.
1335  */
1336 static inline int scsi_dev_queue_ready(struct request_queue *q,
1337                                   struct scsi_device *sdev)
1338 {
1339         if (sdev->device_busy == 0 && sdev->device_blocked) {
1340                 /*
1341                  * unblock after device_blocked iterates to zero
1342                  */
1343                 if (--sdev->device_blocked == 0) {
1344                         SCSI_LOG_MLQUEUE(3,
1345                                    sdev_printk(KERN_INFO, sdev,
1346                                    "unblocking device at zero depth\n"));
1347                 } else {
1348                         blk_delay_queue(q, SCSI_QUEUE_DELAY);
1349                         return 0;
1350                 }
1351         }
1352         if (scsi_device_is_busy(sdev))
1353                 return 0;
1354
1355         return 1;
1356 }
1357
1358
1359 /*
1360  * scsi_target_queue_ready: checks if there we can send commands to target
1361  * @sdev: scsi device on starget to check.
1362  *
1363  * Called with the host lock held.
1364  */
1365 static inline int scsi_target_queue_ready(struct Scsi_Host *shost,
1366                                            struct scsi_device *sdev)
1367 {
1368         struct scsi_target *starget = scsi_target(sdev);
1369
1370         if (starget->single_lun) {
1371                 if (starget->starget_sdev_user &&
1372                     starget->starget_sdev_user != sdev)
1373                         return 0;
1374                 starget->starget_sdev_user = sdev;
1375         }
1376
1377         if (starget->target_busy == 0 && starget->target_blocked) {
1378                 /*
1379                  * unblock after target_blocked iterates to zero
1380                  */
1381                 if (--starget->target_blocked == 0) {
1382                         SCSI_LOG_MLQUEUE(3, starget_printk(KERN_INFO, starget,
1383                                          "unblocking target at zero depth\n"));
1384                 } else
1385                         return 0;
1386         }
1387
1388         if (scsi_target_is_busy(starget)) {
1389                 list_move_tail(&sdev->starved_entry, &shost->starved_list);
1390                 return 0;
1391         }
1392
1393         return 1;
1394 }
1395
1396 /*
1397  * scsi_host_queue_ready: if we can send requests to shost, return 1 else
1398  * return 0. We must end up running the queue again whenever 0 is
1399  * returned, else IO can hang.
1400  *
1401  * Called with host_lock held.
1402  */
1403 static inline int scsi_host_queue_ready(struct request_queue *q,
1404                                    struct Scsi_Host *shost,
1405                                    struct scsi_device *sdev)
1406 {
1407         if (scsi_host_in_recovery(shost))
1408                 return 0;
1409         if (shost->host_busy == 0 && shost->host_blocked) {
1410                 /*
1411                  * unblock after host_blocked iterates to zero
1412                  */
1413                 if (--shost->host_blocked == 0) {
1414                         SCSI_LOG_MLQUEUE(3,
1415                                 printk("scsi%d unblocking host at zero depth\n",
1416                                         shost->host_no));
1417                 } else {
1418                         return 0;
1419                 }
1420         }
1421         if (scsi_host_is_busy(shost)) {
1422                 if (list_empty(&sdev->starved_entry))
1423                         list_add_tail(&sdev->starved_entry, &shost->starved_list);
1424                 return 0;
1425         }
1426
1427         /* We're OK to process the command, so we can't be starved */
1428         if (!list_empty(&sdev->starved_entry))
1429                 list_del_init(&sdev->starved_entry);
1430
1431         return 1;
1432 }
1433
1434 /*
1435  * Busy state exporting function for request stacking drivers.
1436  *
1437  * For efficiency, no lock is taken to check the busy state of
1438  * shost/starget/sdev, since the returned value is not guaranteed and
1439  * may be changed after request stacking drivers call the function,
1440  * regardless of taking lock or not.
1441  *
1442  * When scsi can't dispatch I/Os anymore and needs to kill I/Os scsi
1443  * needs to return 'not busy'. Otherwise, request stacking drivers
1444  * may hold requests forever.
1445  */
1446 static int scsi_lld_busy(struct request_queue *q)
1447 {
1448         struct scsi_device *sdev = q->queuedata;
1449         struct Scsi_Host *shost;
1450
1451         if (blk_queue_dying(q))
1452                 return 0;
1453
1454         shost = sdev->host;
1455
1456         /*
1457          * Ignore host/starget busy state.
1458          * Since block layer does not have a concept of fairness across
1459          * multiple queues, congestion of host/starget needs to be handled
1460          * in SCSI layer.
1461          */
1462         if (scsi_host_in_recovery(shost) || scsi_device_is_busy(sdev))
1463                 return 1;
1464
1465         return 0;
1466 }
1467
1468 /*
1469  * Kill a request for a dead device
1470  */
1471 static void scsi_kill_request(struct request *req, struct request_queue *q)
1472 {
1473         struct scsi_cmnd *cmd = req->special;
1474         struct scsi_device *sdev;
1475         struct scsi_target *starget;
1476         struct Scsi_Host *shost;
1477
1478         blk_start_request(req);
1479
1480         scmd_printk(KERN_INFO, cmd, "killing request\n");
1481
1482         sdev = cmd->device;
1483         starget = scsi_target(sdev);
1484         shost = sdev->host;
1485         scsi_init_cmd_errh(cmd);
1486         cmd->result = DID_NO_CONNECT << 16;
1487         atomic_inc(&cmd->device->iorequest_cnt);
1488
1489         /*
1490          * SCSI request completion path will do scsi_device_unbusy(),
1491          * bump busy counts.  To bump the counters, we need to dance
1492          * with the locks as normal issue path does.
1493          */
1494         sdev->device_busy++;
1495         spin_unlock(sdev->request_queue->queue_lock);
1496         spin_lock(shost->host_lock);
1497         shost->host_busy++;
1498         starget->target_busy++;
1499         spin_unlock(shost->host_lock);
1500         spin_lock(sdev->request_queue->queue_lock);
1501
1502         blk_complete_request(req);
1503 }
1504
1505 static void scsi_softirq_done(struct request *rq)
1506 {
1507         struct scsi_cmnd *cmd = rq->special;
1508         unsigned long wait_for = (cmd->allowed + 1) * rq->timeout;
1509         int disposition;
1510
1511         INIT_LIST_HEAD(&cmd->eh_entry);
1512
1513         atomic_inc(&cmd->device->iodone_cnt);
1514         if (cmd->result)
1515                 atomic_inc(&cmd->device->ioerr_cnt);
1516
1517         disposition = scsi_decide_disposition(cmd);
1518         if (disposition != SUCCESS &&
1519             time_before(cmd->jiffies_at_alloc + wait_for, jiffies)) {
1520                 sdev_printk(KERN_ERR, cmd->device,
1521                             "timing out command, waited %lus\n",
1522                             wait_for/HZ);
1523                 disposition = SUCCESS;
1524         }
1525
1526         scsi_log_completion(cmd, disposition);
1527
1528         switch (disposition) {
1529                 case SUCCESS:
1530                         scsi_finish_command(cmd);
1531                         break;
1532                 case NEEDS_RETRY:
1533                         scsi_queue_insert(cmd, SCSI_MLQUEUE_EH_RETRY);
1534                         break;
1535                 case ADD_TO_MLQUEUE:
1536                         scsi_queue_insert(cmd, SCSI_MLQUEUE_DEVICE_BUSY);
1537                         break;
1538                 default:
1539                         if (!scsi_eh_scmd_add(cmd, 0))
1540                                 scsi_finish_command(cmd);
1541         }
1542 }
1543
1544 /*
1545  * Function:    scsi_request_fn()
1546  *
1547  * Purpose:     Main strategy routine for SCSI.
1548  *
1549  * Arguments:   q       - Pointer to actual queue.
1550  *
1551  * Returns:     Nothing
1552  *
1553  * Lock status: IO request lock assumed to be held when called.
1554  */
1555 static void scsi_request_fn(struct request_queue *q)
1556 {
1557         struct scsi_device *sdev = q->queuedata;
1558         struct Scsi_Host *shost;
1559         struct scsi_cmnd *cmd;
1560         struct request *req;
1561
1562         if(!get_device(&sdev->sdev_gendev))
1563                 /* We must be tearing the block queue down already */
1564                 return;
1565
1566         /*
1567          * To start with, we keep looping until the queue is empty, or until
1568          * the host is no longer able to accept any more requests.
1569          */
1570         shost = sdev->host;
1571         for (;;) {
1572                 int rtn;
1573                 /*
1574                  * get next queueable request.  We do this early to make sure
1575                  * that the request is fully prepared even if we cannot
1576                  * accept it.
1577                  */
1578                 req = blk_peek_request(q);
1579                 if (!req || !scsi_dev_queue_ready(q, sdev))
1580                         break;
1581
1582                 if (unlikely(!scsi_device_online(sdev))) {
1583                         sdev_printk(KERN_ERR, sdev,
1584                                     "rejecting I/O to offline device\n");
1585                         scsi_kill_request(req, q);
1586                         continue;
1587                 }
1588
1589
1590                 /*
1591                  * Remove the request from the request list.
1592                  */
1593                 if (!(blk_queue_tagged(q) && !blk_queue_start_tag(q, req)))
1594                         blk_start_request(req);
1595                 sdev->device_busy++;
1596
1597                 spin_unlock(q->queue_lock);
1598                 cmd = req->special;
1599                 if (unlikely(cmd == NULL)) {
1600                         printk(KERN_CRIT "impossible request in %s.\n"
1601                                          "please mail a stack trace to "
1602                                          "linux-scsi@vger.kernel.org\n",
1603                                          __func__);
1604                         blk_dump_rq_flags(req, "foo");
1605                         BUG();
1606                 }
1607                 spin_lock(shost->host_lock);
1608
1609                 /*
1610                  * We hit this when the driver is using a host wide
1611                  * tag map. For device level tag maps the queue_depth check
1612                  * in the device ready fn would prevent us from trying
1613                  * to allocate a tag. Since the map is a shared host resource
1614                  * we add the dev to the starved list so it eventually gets
1615                  * a run when a tag is freed.
1616                  */
1617                 if (blk_queue_tagged(q) && !blk_rq_tagged(req)) {
1618                         if (list_empty(&sdev->starved_entry))
1619                                 list_add_tail(&sdev->starved_entry,
1620                                               &shost->starved_list);
1621                         goto not_ready;
1622                 }
1623
1624                 if (!scsi_target_queue_ready(shost, sdev))
1625                         goto not_ready;
1626
1627                 if (!scsi_host_queue_ready(q, shost, sdev))
1628                         goto not_ready;
1629
1630                 scsi_target(sdev)->target_busy++;
1631                 shost->host_busy++;
1632
1633                 /*
1634                  * XXX(hch): This is rather suboptimal, scsi_dispatch_cmd will
1635                  *              take the lock again.
1636                  */
1637                 spin_unlock_irq(shost->host_lock);
1638
1639                 /*
1640                  * Finally, initialize any error handling parameters, and set up
1641                  * the timers for timeouts.
1642                  */
1643                 scsi_init_cmd_errh(cmd);
1644
1645                 /*
1646                  * Dispatch the command to the low-level driver.
1647                  */
1648                 rtn = scsi_dispatch_cmd(cmd);
1649                 spin_lock_irq(q->queue_lock);
1650                 if (rtn)
1651                         goto out_delay;
1652         }
1653
1654         goto out;
1655
1656  not_ready:
1657         spin_unlock_irq(shost->host_lock);
1658
1659         /*
1660          * lock q, handle tag, requeue req, and decrement device_busy. We
1661          * must return with queue_lock held.
1662          *
1663          * Decrementing device_busy without checking it is OK, as all such
1664          * cases (host limits or settings) should run the queue at some
1665          * later time.
1666          */
1667         spin_lock_irq(q->queue_lock);
1668         blk_requeue_request(q, req);
1669         sdev->device_busy--;
1670 out_delay:
1671         if (sdev->device_busy == 0)
1672                 blk_delay_queue(q, SCSI_QUEUE_DELAY);
1673 out:
1674         /* must be careful here...if we trigger the ->remove() function
1675          * we cannot be holding the q lock */
1676         spin_unlock_irq(q->queue_lock);
1677         put_device(&sdev->sdev_gendev);
1678         spin_lock_irq(q->queue_lock);
1679 }
1680
1681 u64 scsi_calculate_bounce_limit(struct Scsi_Host *shost)
1682 {
1683         struct device *host_dev;
1684         u64 bounce_limit = 0xffffffff;
1685
1686         if (shost->unchecked_isa_dma)
1687                 return BLK_BOUNCE_ISA;
1688         /*
1689          * Platforms with virtual-DMA translation
1690          * hardware have no practical limit.
1691          */
1692         if (!PCI_DMA_BUS_IS_PHYS)
1693                 return BLK_BOUNCE_ANY;
1694
1695         host_dev = scsi_get_device(shost);
1696         if (host_dev && host_dev->dma_mask)
1697                 bounce_limit = (u64)dma_max_pfn(host_dev) << PAGE_SHIFT;
1698
1699         return bounce_limit;
1700 }
1701 EXPORT_SYMBOL(scsi_calculate_bounce_limit);
1702
1703 struct request_queue *__scsi_alloc_queue(struct Scsi_Host *shost,
1704                                          request_fn_proc *request_fn)
1705 {
1706         struct request_queue *q;
1707         struct device *dev = shost->dma_dev;
1708
1709         q = blk_init_queue(request_fn, NULL);
1710         if (!q)
1711                 return NULL;
1712
1713         /*
1714          * this limit is imposed by hardware restrictions
1715          */
1716         blk_queue_max_segments(q, min_t(unsigned short, shost->sg_tablesize,
1717                                         SCSI_MAX_SG_CHAIN_SEGMENTS));
1718
1719         if (scsi_host_prot_dma(shost)) {
1720                 shost->sg_prot_tablesize =
1721                         min_not_zero(shost->sg_prot_tablesize,
1722                                      (unsigned short)SCSI_MAX_PROT_SG_SEGMENTS);
1723                 BUG_ON(shost->sg_prot_tablesize < shost->sg_tablesize);
1724                 blk_queue_max_integrity_segments(q, shost->sg_prot_tablesize);
1725         }
1726
1727         blk_queue_max_hw_sectors(q, shost->max_sectors);
1728         blk_queue_bounce_limit(q, scsi_calculate_bounce_limit(shost));
1729         blk_queue_segment_boundary(q, shost->dma_boundary);
1730         dma_set_seg_boundary(dev, shost->dma_boundary);
1731
1732         blk_queue_max_segment_size(q, dma_get_max_seg_size(dev));
1733
1734         if (!shost->use_clustering)
1735                 q->limits.cluster = 0;
1736
1737         /*
1738          * set a reasonable default alignment on word boundaries: the
1739          * host and device may alter it using
1740          * blk_queue_update_dma_alignment() later.
1741          */
1742         blk_queue_dma_alignment(q, 0x03);
1743
1744         return q;
1745 }
1746 EXPORT_SYMBOL(__scsi_alloc_queue);
1747
1748 struct request_queue *scsi_alloc_queue(struct scsi_device *sdev)
1749 {
1750         struct request_queue *q;
1751
1752         q = __scsi_alloc_queue(sdev->host, scsi_request_fn);
1753         if (!q)
1754                 return NULL;
1755
1756         blk_queue_prep_rq(q, scsi_prep_fn);
1757         blk_queue_softirq_done(q, scsi_softirq_done);
1758         blk_queue_rq_timed_out(q, scsi_times_out);
1759         blk_queue_lld_busy(q, scsi_lld_busy);
1760         return q;
1761 }
1762
1763 /*
1764  * Function:    scsi_block_requests()
1765  *
1766  * Purpose:     Utility function used by low-level drivers to prevent further
1767  *              commands from being queued to the device.
1768  *
1769  * Arguments:   shost       - Host in question
1770  *
1771  * Returns:     Nothing
1772  *
1773  * Lock status: No locks are assumed held.
1774  *
1775  * Notes:       There is no timer nor any other means by which the requests
1776  *              get unblocked other than the low-level driver calling
1777  *              scsi_unblock_requests().
1778  */
1779 void scsi_block_requests(struct Scsi_Host *shost)
1780 {
1781         shost->host_self_blocked = 1;
1782 }
1783 EXPORT_SYMBOL(scsi_block_requests);
1784
1785 /*
1786  * Function:    scsi_unblock_requests()
1787  *
1788  * Purpose:     Utility function used by low-level drivers to allow further
1789  *              commands from being queued to the device.
1790  *
1791  * Arguments:   shost       - Host in question
1792  *
1793  * Returns:     Nothing
1794  *
1795  * Lock status: No locks are assumed held.
1796  *
1797  * Notes:       There is no timer nor any other means by which the requests
1798  *              get unblocked other than the low-level driver calling
1799  *              scsi_unblock_requests().
1800  *
1801  *              This is done as an API function so that changes to the
1802  *              internals of the scsi mid-layer won't require wholesale
1803  *              changes to drivers that use this feature.
1804  */
1805 void scsi_unblock_requests(struct Scsi_Host *shost)
1806 {
1807         shost->host_self_blocked = 0;
1808         scsi_run_host_queues(shost);
1809 }
1810 EXPORT_SYMBOL(scsi_unblock_requests);
1811
1812 int __init scsi_init_queue(void)
1813 {
1814         int i;
1815
1816         scsi_sdb_cache = kmem_cache_create("scsi_data_buffer",
1817                                            sizeof(struct scsi_data_buffer),
1818                                            0, 0, NULL);
1819         if (!scsi_sdb_cache) {
1820                 printk(KERN_ERR "SCSI: can't init scsi sdb cache\n");
1821                 return -ENOMEM;
1822         }
1823
1824         for (i = 0; i < SG_MEMPOOL_NR; i++) {
1825                 struct scsi_host_sg_pool *sgp = scsi_sg_pools + i;
1826                 int size = sgp->size * sizeof(struct scatterlist);
1827
1828                 sgp->slab = kmem_cache_create(sgp->name, size, 0,
1829                                 SLAB_HWCACHE_ALIGN, NULL);
1830                 if (!sgp->slab) {
1831                         printk(KERN_ERR "SCSI: can't init sg slab %s\n",
1832                                         sgp->name);
1833                         goto cleanup_sdb;
1834                 }
1835
1836                 sgp->pool = mempool_create_slab_pool(SG_MEMPOOL_SIZE,
1837                                                      sgp->slab);
1838                 if (!sgp->pool) {
1839                         printk(KERN_ERR "SCSI: can't init sg mempool %s\n",
1840                                         sgp->name);
1841                         goto cleanup_sdb;
1842                 }
1843         }
1844
1845         return 0;
1846
1847 cleanup_sdb:
1848         for (i = 0; i < SG_MEMPOOL_NR; i++) {
1849                 struct scsi_host_sg_pool *sgp = scsi_sg_pools + i;
1850                 if (sgp->pool)
1851                         mempool_destroy(sgp->pool);
1852                 if (sgp->slab)
1853                         kmem_cache_destroy(sgp->slab);
1854         }
1855         kmem_cache_destroy(scsi_sdb_cache);
1856
1857         return -ENOMEM;
1858 }
1859
1860 void scsi_exit_queue(void)
1861 {
1862         int i;
1863
1864         kmem_cache_destroy(scsi_sdb_cache);
1865
1866         for (i = 0; i < SG_MEMPOOL_NR; i++) {
1867                 struct scsi_host_sg_pool *sgp = scsi_sg_pools + i;
1868                 mempool_destroy(sgp->pool);
1869                 kmem_cache_destroy(sgp->slab);
1870         }
1871 }
1872
1873 /**
1874  *      scsi_mode_select - issue a mode select
1875  *      @sdev:  SCSI device to be queried
1876  *      @pf:    Page format bit (1 == standard, 0 == vendor specific)
1877  *      @sp:    Save page bit (0 == don't save, 1 == save)
1878  *      @modepage: mode page being requested
1879  *      @buffer: request buffer (may not be smaller than eight bytes)
1880  *      @len:   length of request buffer.
1881  *      @timeout: command timeout
1882  *      @retries: number of retries before failing
1883  *      @data: returns a structure abstracting the mode header data
1884  *      @sshdr: place to put sense data (or NULL if no sense to be collected).
1885  *              must be SCSI_SENSE_BUFFERSIZE big.
1886  *
1887  *      Returns zero if successful; negative error number or scsi
1888  *      status on error
1889  *
1890  */
1891 int
1892 scsi_mode_select(struct scsi_device *sdev, int pf, int sp, int modepage,
1893                  unsigned char *buffer, int len, int timeout, int retries,
1894                  struct scsi_mode_data *data, struct scsi_sense_hdr *sshdr)
1895 {
1896         unsigned char cmd[10];
1897         unsigned char *real_buffer;
1898         int ret;
1899
1900         memset(cmd, 0, sizeof(cmd));
1901         cmd[1] = (pf ? 0x10 : 0) | (sp ? 0x01 : 0);
1902
1903         if (sdev->use_10_for_ms) {
1904                 if (len > 65535)
1905                         return -EINVAL;
1906                 real_buffer = kmalloc(8 + len, GFP_KERNEL);
1907                 if (!real_buffer)
1908                         return -ENOMEM;
1909                 memcpy(real_buffer + 8, buffer, len);
1910                 len += 8;
1911                 real_buffer[0] = 0;
1912                 real_buffer[1] = 0;
1913                 real_buffer[2] = data->medium_type;
1914                 real_buffer[3] = data->device_specific;
1915                 real_buffer[4] = data->longlba ? 0x01 : 0;
1916                 real_buffer[5] = 0;
1917                 real_buffer[6] = data->block_descriptor_length >> 8;
1918                 real_buffer[7] = data->block_descriptor_length;
1919
1920                 cmd[0] = MODE_SELECT_10;
1921                 cmd[7] = len >> 8;
1922                 cmd[8] = len;
1923         } else {
1924                 if (len > 255 || data->block_descriptor_length > 255 ||
1925                     data->longlba)
1926                         return -EINVAL;
1927
1928                 real_buffer = kmalloc(4 + len, GFP_KERNEL);
1929                 if (!real_buffer)
1930                         return -ENOMEM;
1931                 memcpy(real_buffer + 4, buffer, len);
1932                 len += 4;
1933                 real_buffer[0] = 0;
1934                 real_buffer[1] = data->medium_type;
1935                 real_buffer[2] = data->device_specific;
1936                 real_buffer[3] = data->block_descriptor_length;
1937
1938
1939                 cmd[0] = MODE_SELECT;
1940                 cmd[4] = len;
1941         }
1942
1943         ret = scsi_execute_req(sdev, cmd, DMA_TO_DEVICE, real_buffer, len,
1944                                sshdr, timeout, retries, NULL);
1945         kfree(real_buffer);
1946         return ret;
1947 }
1948 EXPORT_SYMBOL_GPL(scsi_mode_select);
1949
1950 /**
1951  *      scsi_mode_sense - issue a mode sense, falling back from 10 to six bytes if necessary.
1952  *      @sdev:  SCSI device to be queried
1953  *      @dbd:   set if mode sense will allow block descriptors to be returned
1954  *      @modepage: mode page being requested
1955  *      @buffer: request buffer (may not be smaller than eight bytes)
1956  *      @len:   length of request buffer.
1957  *      @timeout: command timeout
1958  *      @retries: number of retries before failing
1959  *      @data: returns a structure abstracting the mode header data
1960  *      @sshdr: place to put sense data (or NULL if no sense to be collected).
1961  *              must be SCSI_SENSE_BUFFERSIZE big.
1962  *
1963  *      Returns zero if unsuccessful, or the header offset (either 4
1964  *      or 8 depending on whether a six or ten byte command was
1965  *      issued) if successful.
1966  */
1967 int
1968 scsi_mode_sense(struct scsi_device *sdev, int dbd, int modepage,
1969                   unsigned char *buffer, int len, int timeout, int retries,
1970                   struct scsi_mode_data *data, struct scsi_sense_hdr *sshdr)
1971 {
1972         unsigned char cmd[12];
1973         int use_10_for_ms;
1974         int header_length;
1975         int result;
1976         struct scsi_sense_hdr my_sshdr;
1977
1978         memset(data, 0, sizeof(*data));
1979         memset(&cmd[0], 0, 12);
1980         cmd[1] = dbd & 0x18;    /* allows DBD and LLBA bits */
1981         cmd[2] = modepage;
1982
1983         /* caller might not be interested in sense, but we need it */
1984         if (!sshdr)
1985                 sshdr = &my_sshdr;
1986
1987  retry:
1988         use_10_for_ms = sdev->use_10_for_ms;
1989
1990         if (use_10_for_ms) {
1991                 if (len < 8)
1992                         len = 8;
1993
1994                 cmd[0] = MODE_SENSE_10;
1995                 cmd[8] = len;
1996                 header_length = 8;
1997         } else {
1998                 if (len < 4)
1999                         len = 4;
2000
2001                 cmd[0] = MODE_SENSE;
2002                 cmd[4] = len;
2003                 header_length = 4;
2004         }
2005
2006         memset(buffer, 0, len);
2007
2008         result = scsi_execute_req(sdev, cmd, DMA_FROM_DEVICE, buffer, len,
2009                                   sshdr, timeout, retries, NULL);
2010
2011         /* This code looks awful: what it's doing is making sure an
2012          * ILLEGAL REQUEST sense return identifies the actual command
2013          * byte as the problem.  MODE_SENSE commands can return
2014          * ILLEGAL REQUEST if the code page isn't supported */
2015
2016         if (use_10_for_ms && !scsi_status_is_good(result) &&
2017             (driver_byte(result) & DRIVER_SENSE)) {
2018                 if (scsi_sense_valid(sshdr)) {
2019                         if ((sshdr->sense_key == ILLEGAL_REQUEST) &&
2020                             (sshdr->asc == 0x20) && (sshdr->ascq == 0)) {
2021                                 /*
2022                                  * Invalid command operation code
2023                                  */
2024                                 sdev->use_10_for_ms = 0;
2025                                 goto retry;
2026                         }
2027                 }
2028         }
2029
2030         if(scsi_status_is_good(result)) {
2031                 if (unlikely(buffer[0] == 0x86 && buffer[1] == 0x0b &&
2032                              (modepage == 6 || modepage == 8))) {
2033                         /* Initio breakage? */
2034                         header_length = 0;
2035                         data->length = 13;
2036                         data->medium_type = 0;
2037                         data->device_specific = 0;
2038                         data->longlba = 0;
2039                         data->block_descriptor_length = 0;
2040                 } else if(use_10_for_ms) {
2041                         data->length = buffer[0]*256 + buffer[1] + 2;
2042                         data->medium_type = buffer[2];
2043                         data->device_specific = buffer[3];
2044                         data->longlba = buffer[4] & 0x01;
2045                         data->block_descriptor_length = buffer[6]*256
2046                                 + buffer[7];
2047                 } else {
2048                         data->length = buffer[0] + 1;
2049                         data->medium_type = buffer[1];
2050                         data->device_specific = buffer[2];
2051                         data->block_descriptor_length = buffer[3];
2052                 }
2053                 data->header_length = header_length;
2054         }
2055
2056         return result;
2057 }
2058 EXPORT_SYMBOL(scsi_mode_sense);
2059
2060 /**
2061  *      scsi_test_unit_ready - test if unit is ready
2062  *      @sdev:  scsi device to change the state of.
2063  *      @timeout: command timeout
2064  *      @retries: number of retries before failing
2065  *      @sshdr_external: Optional pointer to struct scsi_sense_hdr for
2066  *              returning sense. Make sure that this is cleared before passing
2067  *              in.
2068  *
2069  *      Returns zero if unsuccessful or an error if TUR failed.  For
2070  *      removable media, UNIT_ATTENTION sets ->changed flag.
2071  **/
2072 int
2073 scsi_test_unit_ready(struct scsi_device *sdev, int timeout, int retries,
2074                      struct scsi_sense_hdr *sshdr_external)
2075 {
2076         char cmd[] = {
2077                 TEST_UNIT_READY, 0, 0, 0, 0, 0,
2078         };
2079         struct scsi_sense_hdr *sshdr;
2080         int result;
2081
2082         if (!sshdr_external)
2083                 sshdr = kzalloc(sizeof(*sshdr), GFP_KERNEL);
2084         else
2085                 sshdr = sshdr_external;
2086
2087         /* try to eat the UNIT_ATTENTION if there are enough retries */
2088         do {
2089                 result = scsi_execute_req(sdev, cmd, DMA_NONE, NULL, 0, sshdr,
2090                                           timeout, retries, NULL);
2091                 if (sdev->removable && scsi_sense_valid(sshdr) &&
2092                     sshdr->sense_key == UNIT_ATTENTION)
2093                         sdev->changed = 1;
2094         } while (scsi_sense_valid(sshdr) &&
2095                  sshdr->sense_key == UNIT_ATTENTION && --retries);
2096
2097         if (!sshdr_external)
2098                 kfree(sshdr);
2099         return result;
2100 }
2101 EXPORT_SYMBOL(scsi_test_unit_ready);
2102
2103 /**
2104  *      scsi_device_set_state - Take the given device through the device state model.
2105  *      @sdev:  scsi device to change the state of.
2106  *      @state: state to change to.
2107  *
2108  *      Returns zero if unsuccessful or an error if the requested
2109  *      transition is illegal.
2110  */
2111 int
2112 scsi_device_set_state(struct scsi_device *sdev, enum scsi_device_state state)
2113 {
2114         enum scsi_device_state oldstate = sdev->sdev_state;
2115
2116         if (state == oldstate)
2117                 return 0;
2118
2119         switch (state) {
2120         case SDEV_CREATED:
2121                 switch (oldstate) {
2122                 case SDEV_CREATED_BLOCK:
2123                         break;
2124                 default:
2125                         goto illegal;
2126                 }
2127                 break;
2128
2129         case SDEV_RUNNING:
2130                 switch (oldstate) {
2131                 case SDEV_CREATED:
2132                 case SDEV_OFFLINE:
2133                 case SDEV_TRANSPORT_OFFLINE:
2134                 case SDEV_QUIESCE:
2135                 case SDEV_BLOCK:
2136                         break;
2137                 default:
2138                         goto illegal;
2139                 }
2140                 break;
2141
2142         case SDEV_QUIESCE:
2143                 switch (oldstate) {
2144                 case SDEV_RUNNING:
2145                 case SDEV_OFFLINE:
2146                 case SDEV_TRANSPORT_OFFLINE:
2147                         break;
2148                 default:
2149                         goto illegal;
2150                 }
2151                 break;
2152
2153         case SDEV_OFFLINE:
2154         case SDEV_TRANSPORT_OFFLINE:
2155                 switch (oldstate) {
2156                 case SDEV_CREATED:
2157                 case SDEV_RUNNING:
2158                 case SDEV_QUIESCE:
2159                 case SDEV_BLOCK:
2160                         break;
2161                 default:
2162                         goto illegal;
2163                 }
2164                 break;
2165
2166         case SDEV_BLOCK:
2167                 switch (oldstate) {
2168                 case SDEV_RUNNING:
2169                 case SDEV_CREATED_BLOCK:
2170                         break;
2171                 default:
2172                         goto illegal;
2173                 }
2174                 break;
2175
2176         case SDEV_CREATED_BLOCK:
2177                 switch (oldstate) {
2178                 case SDEV_CREATED:
2179                         break;
2180                 default:
2181                         goto illegal;
2182                 }
2183                 break;
2184
2185         case SDEV_CANCEL:
2186                 switch (oldstate) {
2187                 case SDEV_CREATED:
2188                 case SDEV_RUNNING:
2189                 case SDEV_QUIESCE:
2190                 case SDEV_OFFLINE:
2191                 case SDEV_TRANSPORT_OFFLINE:
2192                 case SDEV_BLOCK:
2193                         break;
2194                 default:
2195                         goto illegal;
2196                 }
2197                 break;
2198
2199         case SDEV_DEL:
2200                 switch (oldstate) {
2201                 case SDEV_CREATED:
2202                 case SDEV_RUNNING:
2203                 case SDEV_OFFLINE:
2204                 case SDEV_TRANSPORT_OFFLINE:
2205                 case SDEV_CANCEL:
2206                 case SDEV_CREATED_BLOCK:
2207                         break;
2208                 default:
2209                         goto illegal;
2210                 }
2211                 break;
2212
2213         }
2214         sdev->sdev_state = state;
2215         return 0;
2216
2217  illegal:
2218         SCSI_LOG_ERROR_RECOVERY(1,
2219                                 sdev_printk(KERN_ERR, sdev,
2220                                             "Illegal state transition %s->%s\n",
2221                                             scsi_device_state_name(oldstate),
2222                                             scsi_device_state_name(state))
2223                                 );
2224         return -EINVAL;
2225 }
2226 EXPORT_SYMBOL(scsi_device_set_state);
2227
2228 /**
2229  *      sdev_evt_emit - emit a single SCSI device uevent
2230  *      @sdev: associated SCSI device
2231  *      @evt: event to emit
2232  *
2233  *      Send a single uevent (scsi_event) to the associated scsi_device.
2234  */
2235 static void scsi_evt_emit(struct scsi_device *sdev, struct scsi_event *evt)
2236 {
2237         int idx = 0;
2238         char *envp[3];
2239
2240         switch (evt->evt_type) {
2241         case SDEV_EVT_MEDIA_CHANGE:
2242                 envp[idx++] = "SDEV_MEDIA_CHANGE=1";
2243                 break;
2244         case SDEV_EVT_INQUIRY_CHANGE_REPORTED:
2245                 envp[idx++] = "SDEV_UA=INQUIRY_DATA_HAS_CHANGED";
2246                 break;
2247         case SDEV_EVT_CAPACITY_CHANGE_REPORTED:
2248                 envp[idx++] = "SDEV_UA=CAPACITY_DATA_HAS_CHANGED";
2249                 break;
2250         case SDEV_EVT_SOFT_THRESHOLD_REACHED_REPORTED:
2251                envp[idx++] = "SDEV_UA=THIN_PROVISIONING_SOFT_THRESHOLD_REACHED";
2252                 break;
2253         case SDEV_EVT_MODE_PARAMETER_CHANGE_REPORTED:
2254                 envp[idx++] = "SDEV_UA=MODE_PARAMETERS_CHANGED";
2255                 break;
2256         case SDEV_EVT_LUN_CHANGE_REPORTED:
2257                 envp[idx++] = "SDEV_UA=REPORTED_LUNS_DATA_HAS_CHANGED";
2258                 break;
2259         default:
2260                 /* do nothing */
2261                 break;
2262         }
2263
2264         envp[idx++] = NULL;
2265
2266         kobject_uevent_env(&sdev->sdev_gendev.kobj, KOBJ_CHANGE, envp);
2267 }
2268
2269 /**
2270  *      sdev_evt_thread - send a uevent for each scsi event
2271  *      @work: work struct for scsi_device
2272  *
2273  *      Dispatch queued events to their associated scsi_device kobjects
2274  *      as uevents.
2275  */
2276 void scsi_evt_thread(struct work_struct *work)
2277 {
2278         struct scsi_device *sdev;
2279         enum scsi_device_event evt_type;
2280         LIST_HEAD(event_list);
2281
2282         sdev = container_of(work, struct scsi_device, event_work);
2283
2284         for (evt_type = SDEV_EVT_FIRST; evt_type <= SDEV_EVT_LAST; evt_type++)
2285                 if (test_and_clear_bit(evt_type, sdev->pending_events))
2286                         sdev_evt_send_simple(sdev, evt_type, GFP_KERNEL);
2287
2288         while (1) {
2289                 struct scsi_event *evt;
2290                 struct list_head *this, *tmp;
2291                 unsigned long flags;
2292
2293                 spin_lock_irqsave(&sdev->list_lock, flags);
2294                 list_splice_init(&sdev->event_list, &event_list);
2295                 spin_unlock_irqrestore(&sdev->list_lock, flags);
2296
2297                 if (list_empty(&event_list))
2298                         break;
2299
2300                 list_for_each_safe(this, tmp, &event_list) {
2301                         evt = list_entry(this, struct scsi_event, node);
2302                         list_del(&evt->node);
2303                         scsi_evt_emit(sdev, evt);
2304                         kfree(evt);
2305                 }
2306         }
2307 }
2308
2309 /**
2310  *      sdev_evt_send - send asserted event to uevent thread
2311  *      @sdev: scsi_device event occurred on
2312  *      @evt: event to send
2313  *
2314  *      Assert scsi device event asynchronously.
2315  */
2316 void sdev_evt_send(struct scsi_device *sdev, struct scsi_event *evt)
2317 {
2318         unsigned long flags;
2319
2320 #if 0
2321         /* FIXME: currently this check eliminates all media change events
2322          * for polled devices.  Need to update to discriminate between AN
2323          * and polled events */
2324         if (!test_bit(evt->evt_type, sdev->supported_events)) {
2325                 kfree(evt);
2326                 return;
2327         }
2328 #endif
2329
2330         spin_lock_irqsave(&sdev->list_lock, flags);
2331         list_add_tail(&evt->node, &sdev->event_list);
2332         schedule_work(&sdev->event_work);
2333         spin_unlock_irqrestore(&sdev->list_lock, flags);
2334 }
2335 EXPORT_SYMBOL_GPL(sdev_evt_send);
2336
2337 /**
2338  *      sdev_evt_alloc - allocate a new scsi event
2339  *      @evt_type: type of event to allocate
2340  *      @gfpflags: GFP flags for allocation
2341  *
2342  *      Allocates and returns a new scsi_event.
2343  */
2344 struct scsi_event *sdev_evt_alloc(enum scsi_device_event evt_type,
2345                                   gfp_t gfpflags)
2346 {
2347         struct scsi_event *evt = kzalloc(sizeof(struct scsi_event), gfpflags);
2348         if (!evt)
2349                 return NULL;
2350
2351         evt->evt_type = evt_type;
2352         INIT_LIST_HEAD(&evt->node);
2353
2354         /* evt_type-specific initialization, if any */
2355         switch (evt_type) {
2356         case SDEV_EVT_MEDIA_CHANGE:
2357         case SDEV_EVT_INQUIRY_CHANGE_REPORTED:
2358         case SDEV_EVT_CAPACITY_CHANGE_REPORTED:
2359         case SDEV_EVT_SOFT_THRESHOLD_REACHED_REPORTED:
2360         case SDEV_EVT_MODE_PARAMETER_CHANGE_REPORTED:
2361         case SDEV_EVT_LUN_CHANGE_REPORTED:
2362         default:
2363                 /* do nothing */
2364                 break;
2365         }
2366
2367         return evt;
2368 }
2369 EXPORT_SYMBOL_GPL(sdev_evt_alloc);
2370
2371 /**
2372  *      sdev_evt_send_simple - send asserted event to uevent thread
2373  *      @sdev: scsi_device event occurred on
2374  *      @evt_type: type of event to send
2375  *      @gfpflags: GFP flags for allocation
2376  *
2377  *      Assert scsi device event asynchronously, given an event type.
2378  */
2379 void sdev_evt_send_simple(struct scsi_device *sdev,
2380                           enum scsi_device_event evt_type, gfp_t gfpflags)
2381 {
2382         struct scsi_event *evt = sdev_evt_alloc(evt_type, gfpflags);
2383         if (!evt) {
2384                 sdev_printk(KERN_ERR, sdev, "event %d eaten due to OOM\n",
2385                             evt_type);
2386                 return;
2387         }
2388
2389         sdev_evt_send(sdev, evt);
2390 }
2391 EXPORT_SYMBOL_GPL(sdev_evt_send_simple);
2392
2393 /**
2394  *      scsi_device_quiesce - Block user issued commands.
2395  *      @sdev:  scsi device to quiesce.
2396  *
2397  *      This works by trying to transition to the SDEV_QUIESCE state
2398  *      (which must be a legal transition).  When the device is in this
2399  *      state, only special requests will be accepted, all others will
2400  *      be deferred.  Since special requests may also be requeued requests,
2401  *      a successful return doesn't guarantee the device will be
2402  *      totally quiescent.
2403  *
2404  *      Must be called with user context, may sleep.
2405  *
2406  *      Returns zero if unsuccessful or an error if not.
2407  */
2408 int
2409 scsi_device_quiesce(struct scsi_device *sdev)
2410 {
2411         int err = scsi_device_set_state(sdev, SDEV_QUIESCE);
2412         if (err)
2413                 return err;
2414
2415         scsi_run_queue(sdev->request_queue);
2416         while (sdev->device_busy) {
2417                 msleep_interruptible(200);
2418                 scsi_run_queue(sdev->request_queue);
2419         }
2420         return 0;
2421 }
2422 EXPORT_SYMBOL(scsi_device_quiesce);
2423
2424 /**
2425  *      scsi_device_resume - Restart user issued commands to a quiesced device.
2426  *      @sdev:  scsi device to resume.
2427  *
2428  *      Moves the device from quiesced back to running and restarts the
2429  *      queues.
2430  *
2431  *      Must be called with user context, may sleep.
2432  */
2433 void scsi_device_resume(struct scsi_device *sdev)
2434 {
2435         /* check if the device state was mutated prior to resume, and if
2436          * so assume the state is being managed elsewhere (for example
2437          * device deleted during suspend)
2438          */
2439         if (sdev->sdev_state != SDEV_QUIESCE ||
2440             scsi_device_set_state(sdev, SDEV_RUNNING))
2441                 return;
2442         scsi_run_queue(sdev->request_queue);
2443 }
2444 EXPORT_SYMBOL(scsi_device_resume);
2445
/*
 * Per-device callback handed to starget_for_each_device() by
 * scsi_target_quiesce().  @data is unused, and the result of
 * scsi_device_quiesce() is discarded because the callback returns void.
 */
static void device_quiesce_fn(struct scsi_device *sdev, void *data)
{
	(void)scsi_device_quiesce(sdev);
}
2451
2452 void
2453 scsi_target_quiesce(struct scsi_target *starget)
2454 {
2455         starget_for_each_device(starget, NULL, device_quiesce_fn);
2456 }
2457 EXPORT_SYMBOL(scsi_target_quiesce);
2458
/*
 * Per-device callback handed to starget_for_each_device() by
 * scsi_target_resume().  @data is unused.
 */
static void device_resume_fn(struct scsi_device *sdev, void *data)
{
	scsi_device_resume(sdev);
}
2464
2465 void
2466 scsi_target_resume(struct scsi_target *starget)
2467 {
2468         starget_for_each_device(starget, NULL, device_resume_fn);
2469 }
2470 EXPORT_SYMBOL(scsi_target_resume);
2471
2472 /**
2473  * scsi_internal_device_block - internal function to put a device temporarily into the SDEV_BLOCK state
2474  * @sdev:       device to block
2475  *
2476  * Block request made by scsi lld's to temporarily stop all
2477  * scsi commands on the specified device.  Called from interrupt
2478  * or normal process context.
2479  *
2480  * Returns zero if successful or error if not
2481  *
2482  * Notes:
2483  *      This routine transitions the device to the SDEV_BLOCK state
2484  *      (which must be a legal transition).  When the device is in this
2485  *      state, all commands are deferred until the scsi lld reenables
2486  *      the device with scsi_device_unblock or device_block_tmo fires.
2487  */
2488 int
2489 scsi_internal_device_block(struct scsi_device *sdev)
2490 {
2491         struct request_queue *q = sdev->request_queue;
2492         unsigned long flags;
2493         int err = 0;
2494
2495         err = scsi_device_set_state(sdev, SDEV_BLOCK);
2496         if (err) {
2497                 err = scsi_device_set_state(sdev, SDEV_CREATED_BLOCK);
2498
2499                 if (err)
2500                         return err;
2501         }
2502
2503         /*
2504          * The device has transitioned to SDEV_BLOCK.  Stop the
2505          * block layer from calling the midlayer with this device's
2506          * request queue.
2507          */
2508         spin_lock_irqsave(q->queue_lock, flags);
2509         blk_stop_queue(q);
2510         spin_unlock_irqrestore(q->queue_lock, flags);
2511
2512         return 0;
2513 }
2514 EXPORT_SYMBOL_GPL(scsi_internal_device_block);
2515
2516 /**
2517  * scsi_internal_device_unblock - resume a device after a block request
2518  * @sdev:       device to resume
2519  * @new_state:  state to set devices to after unblocking
2520  *
2521  * Called by scsi lld's or the midlayer to restart the device queue
2522  * for the previously suspended scsi device.  Called from interrupt or
2523  * normal process context.
2524  *
2525  * Returns zero if successful or error if not.
2526  *
2527  * Notes:
2528  *      This routine transitions the device to the SDEV_RUNNING state
2529  *      or to one of the offline states (which must be a legal transition)
2530  *      allowing the midlayer to goose the queue for this device.
2531  */
2532 int
2533 scsi_internal_device_unblock(struct scsi_device *sdev,
2534                              enum scsi_device_state new_state)
2535 {
2536         struct request_queue *q = sdev->request_queue;
2537         unsigned long flags;
2538
2539         /*
2540          * Try to transition the scsi device to SDEV_RUNNING or one of the
2541          * offlined states and goose the device queue if successful.
2542          */
2543         if ((sdev->sdev_state == SDEV_BLOCK) ||
2544             (sdev->sdev_state == SDEV_TRANSPORT_OFFLINE))
2545                 sdev->sdev_state = new_state;
2546         else if (sdev->sdev_state == SDEV_CREATED_BLOCK) {
2547                 if (new_state == SDEV_TRANSPORT_OFFLINE ||
2548                     new_state == SDEV_OFFLINE)
2549                         sdev->sdev_state = new_state;
2550                 else
2551                         sdev->sdev_state = SDEV_CREATED;
2552         } else if (sdev->sdev_state != SDEV_CANCEL &&
2553                  sdev->sdev_state != SDEV_OFFLINE)
2554                 return -EINVAL;
2555
2556         spin_lock_irqsave(q->queue_lock, flags);
2557         blk_start_queue(q);
2558         spin_unlock_irqrestore(q->queue_lock, flags);
2559
2560         return 0;
2561 }
2562 EXPORT_SYMBOL_GPL(scsi_internal_device_unblock);
2563
/*
 * Per-device callback for starget_for_each_device(): block one device.
 * @data is unused and the result of scsi_internal_device_block() is
 * discarded because the callback returns void.
 */
static void device_block(struct scsi_device *sdev, void *data)
{
	(void)scsi_internal_device_block(sdev);
}
2569
2570 static int
2571 target_block(struct device *dev, void *data)
2572 {
2573         if (scsi_is_target_device(dev))
2574                 starget_for_each_device(to_scsi_target(dev), NULL,
2575                                         device_block);
2576         return 0;
2577 }
2578
2579 void
2580 scsi_target_block(struct device *dev)
2581 {
2582         if (scsi_is_target_device(dev))
2583                 starget_for_each_device(to_scsi_target(dev), NULL,
2584                                         device_block);
2585         else
2586                 device_for_each_child(dev, NULL, target_block);
2587 }
2588 EXPORT_SYMBOL_GPL(scsi_target_block);
2589
2590 static void
2591 device_unblock(struct scsi_device *sdev, void *data)
2592 {
2593         scsi_internal_device_unblock(sdev, *(enum scsi_device_state *)data);
2594 }
2595
2596 static int
2597 target_unblock(struct device *dev, void *data)
2598 {
2599         if (scsi_is_target_device(dev))
2600                 starget_for_each_device(to_scsi_target(dev), data,
2601                                         device_unblock);
2602         return 0;
2603 }
2604
2605 void
2606 scsi_target_unblock(struct device *dev, enum scsi_device_state new_state)
2607 {
2608         if (scsi_is_target_device(dev))
2609                 starget_for_each_device(to_scsi_target(dev), &new_state,
2610                                         device_unblock);
2611         else
2612                 device_for_each_child(dev, &new_state, target_unblock);
2613 }
2614 EXPORT_SYMBOL_GPL(scsi_target_unblock);
2615
2616 /**
2617  * scsi_kmap_atomic_sg - find and atomically map an sg-elemnt
2618  * @sgl:        scatter-gather list
2619  * @sg_count:   number of segments in sg
2620  * @offset:     offset in bytes into sg, on return offset into the mapped area
2621  * @len:        bytes to map, on return number of bytes mapped
2622  *
2623  * Returns virtual address of the start of the mapped page
2624  */
2625 void *scsi_kmap_atomic_sg(struct scatterlist *sgl, int sg_count,
2626                           size_t *offset, size_t *len)
2627 {
2628         int i;
2629         size_t sg_len = 0, len_complete = 0;
2630         struct scatterlist *sg;
2631         struct page *page;
2632
2633         WARN_ON(!irqs_disabled());
2634
2635         for_each_sg(sgl, sg, sg_count, i) {
2636                 len_complete = sg_len; /* Complete sg-entries */
2637                 sg_len += sg->length;
2638                 if (sg_len > *offset)
2639                         break;
2640         }
2641
2642         if (unlikely(i == sg_count)) {
2643                 printk(KERN_ERR "%s: Bytes in sg: %zu, requested offset %zu, "
2644                         "elements %d\n",
2645                        __func__, sg_len, *offset, sg_count);
2646                 WARN_ON(1);
2647                 return NULL;
2648         }
2649
2650         /* Offset starting from the beginning of first page in this sg-entry */
2651         *offset = *offset - len_complete + sg->offset;
2652
2653         /* Assumption: contiguous pages can be accessed as "page + i" */
2654         page = nth_page(sg_page(sg), (*offset >> PAGE_SHIFT));
2655         *offset &= ~PAGE_MASK;
2656
2657         /* Bytes in this sg-entry from *offset to the end of the page */
2658         sg_len = PAGE_SIZE - *offset;
2659         if (*len > sg_len)
2660                 *len = sg_len;
2661
2662         return kmap_atomic(page);
2663 }
2664 EXPORT_SYMBOL(scsi_kmap_atomic_sg);
2665
/**
 * scsi_kunmap_atomic_sg - atomically unmap a virtual address, previously mapped with scsi_kmap_atomic_sg
 * @virt:	virtual address to be unmapped
 *
 * Thin wrapper that passes @virt straight to kunmap_atomic().
 */
void scsi_kunmap_atomic_sg(void *virt)
{
	kunmap_atomic(virt);
}
EXPORT_SYMBOL(scsi_kunmap_atomic_sg);
2675
2676 void sdev_disable_disk_events(struct scsi_device *sdev)
2677 {
2678         atomic_inc(&sdev->disk_events_disable_depth);
2679 }
2680 EXPORT_SYMBOL(sdev_disable_disk_events);
2681
2682 void sdev_enable_disk_events(struct scsi_device *sdev)
2683 {
2684         if (WARN_ON_ONCE(atomic_read(&sdev->disk_events_disable_depth) <= 0))
2685                 return;
2686         atomic_dec(&sdev->disk_events_disable_depth);
2687 }
2688 EXPORT_SYMBOL(sdev_enable_disk_events);