hpsa: use workqueue to resubmit failed ioaccel commands
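
Instead of completing a failed HP SSD Smart Path (ioaccel) command with
DID_SOFT_ERROR and leaving the retry to the SCSI midlayer, the completion
paths now hand the command to a per-controller workqueue (h->resubmit_wq)
and resubmit it down the normal RAID path (hpsa_ciss_submit) from process
context.  A minimal sketch of the pattern, with the driver structures
abridged for illustration and hpsa_defer_resubmit() a hypothetical wrapper
around the two calls the patch open-codes at each retry site:

    #include <linux/kernel.h>
    #include <linux/workqueue.h>
    #include <linux/smp.h>

    /* Abridged views of the driver structures; the real definitions live
     * in hpsa.h / hpsa_cmd.h and carry many more fields. */
    struct ctlr_info {
            struct workqueue_struct *resubmit_wq;   /* set up at controller init */
            /* ... */
    };

    struct CommandList {
            struct work_struct work;                /* deferred resubmit */
            struct ctlr_info *h;
            /* ... tag, SG descriptors, scsi_cmnd pointer, ... */
    };

    /* Runs in process context; recovers the command embedding the work
     * item and pushes it back down the normal RAID path. */
    static void hpsa_command_resubmit_worker(struct work_struct *work)
    {
            struct CommandList *c = container_of(work, struct CommandList, work);

            /* resubmit via hpsa_ciss_submit(c->h, c, ...), as in the hunks below */
    }

    /* Hypothetical helper: the completion paths open-code these two calls. */
    static void hpsa_defer_resubmit(struct ctlr_info *h, struct CommandList *c)
    {
            INIT_WORK(&c->work, hpsa_command_resubmit_worker);
            queue_work_on(raw_smp_processor_id(), h->resubmit_wq, &c->work);
    }

queue_work_on(raw_smp_processor_id(), ...) keeps the resubmit on the CPU
that processed the completion instead of letting the scheduler pick one.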
diff --git a/drivers/scsi/hpsa.c b/drivers/scsi/hpsa.c
index 6bb4611b238a8421813ab761ac1ecaa53a20cd6d..dcacb29ff5899596a524970fccc9ade6d6305135 100644
--- a/drivers/scsi/hpsa.c
+++ b/drivers/scsi/hpsa.c
@@ -50,6 +50,7 @@
 #include <linux/jiffies.h>
 #include <linux/percpu-defs.h>
 #include <linux/percpu.h>
+#include <asm/unaligned.h>
 #include <asm/div64.h>
 #include "hpsa_cmd.h"
 #include "hpsa.h"
@@ -195,8 +196,6 @@ static int number_of_controllers;
 static irqreturn_t do_hpsa_intr_intx(int irq, void *dev_id);
 static irqreturn_t do_hpsa_intr_msi(int irq, void *dev_id);
 static int hpsa_ioctl(struct scsi_device *dev, int cmd, void __user *arg);
-static void lock_and_start_io(struct ctlr_info *h);
-static void start_io(struct ctlr_info *h, unsigned long *flags);
 
 #ifdef CONFIG_COMPAT
 static int hpsa_compat_ioctl(struct scsi_device *dev, int cmd,
@@ -204,18 +203,18 @@ static int hpsa_compat_ioctl(struct scsi_device *dev, int cmd,
 #endif
 
 static void cmd_free(struct ctlr_info *h, struct CommandList *c);
-static void cmd_special_free(struct ctlr_info *h, struct CommandList *c);
 static struct CommandList *cmd_alloc(struct ctlr_info *h);
-static struct CommandList *cmd_special_alloc(struct ctlr_info *h);
 static int fill_cmd(struct CommandList *c, u8 cmd, struct ctlr_info *h,
        void *buff, size_t size, u16 page_code, unsigned char *scsi3addr,
        int cmd_type);
+static void hpsa_free_cmd_pool(struct ctlr_info *h);
 #define VPD_PAGE (1 << 8)
 
 static int hpsa_scsi_queue_command(struct Scsi_Host *h, struct scsi_cmnd *cmd);
 static void hpsa_scan_start(struct Scsi_Host *);
 static int hpsa_scan_finished(struct Scsi_Host *sh,
        unsigned long elapsed_time);
+static int hpsa_change_queue_depth(struct scsi_device *sdev, int qdepth);
 
 static int hpsa_eh_device_reset_handler(struct scsi_cmnd *scsicmd);
 static int hpsa_eh_abort_handler(struct scsi_cmnd *scsicmd);
@@ -229,7 +228,7 @@ static void check_ioctl_unit_attention(struct ctlr_info *h,
        struct CommandList *c);
 /* performant mode helper functions */
 static void calc_bucket_map(int *bucket, int num_buckets,
-       int nsgs, int min_blocks, int *bucket_map);
+       int nsgs, int min_blocks, u32 *bucket_map);
 static void hpsa_put_ctlr_into_performant_mode(struct ctlr_info *h);
 static inline u32 next_command(struct ctlr_info *h, u8 q);
 static int hpsa_find_cfg_addrs(struct pci_dev *pdev, void __iomem *vaddr,
@@ -249,6 +248,7 @@ static void hpsa_flush_cache(struct ctlr_info *h);
 static int hpsa_scsi_ioaccel_queue_command(struct ctlr_info *h,
        struct CommandList *c, u32 ioaccel_handle, u8 *cdb, int cdb_len,
        u8 *scsi3addr);
+static void hpsa_command_resubmit_worker(struct work_struct *work);
 
 static inline struct ctlr_info *sdev_to_hba(struct scsi_device *sdev)
 {
@@ -505,8 +505,8 @@ static inline int is_logical_dev_addr_mode(unsigned char scsi3addr[])
        return (scsi3addr[3] & 0xC0) == 0x40;
 }
 
-static const char *raid_label[] = { "0", "4", "1(1+0)", "5", "5+1", "ADG",
-       "1(ADM)", "UNKNOWN"
+static const char * const raid_label[] = { "0", "4", "1(+0)", "5", "5+1", "6",
+       "1(+0)ADM", "UNKNOWN"
 };
 #define HPSA_RAID_0    0
 #define HPSA_RAID_4    1
@@ -671,7 +671,7 @@ static struct scsi_host_template hpsa_driver_template = {
        .queuecommand           = hpsa_scsi_queue_command,
        .scan_start             = hpsa_scan_start,
        .scan_finished          = hpsa_scan_finished,
-       .change_queue_depth     = scsi_change_queue_depth,
+       .change_queue_depth     = hpsa_change_queue_depth,
        .this_id                = -1,
        .use_clustering         = ENABLE_CLUSTERING,
        .eh_abort_handler       = hpsa_eh_abort_handler,
@@ -688,13 +688,6 @@ static struct scsi_host_template hpsa_driver_template = {
        .no_write_same = 1,
 };
 
-
-/* Enqueuing and dequeuing functions for cmdlists. */
-static inline void addQ(struct list_head *list, struct CommandList *c)
-{
-       list_add_tail(&c->list, list);
-}
-
 static inline u32 next_command(struct ctlr_info *h, u8 q)
 {
        u32 a;
@@ -828,8 +821,6 @@ static void dial_up_lockup_detection_on_fw_flash_complete(struct ctlr_info *h,
 static void enqueue_cmd_and_start_io(struct ctlr_info *h,
        struct CommandList *c)
 {
-       unsigned long flags;
-
        switch (c->cmd_type) {
        case CMD_IOACCEL1:
                set_ioaccel1_performant_mode(h, c);
@@ -841,18 +832,8 @@ static void enqueue_cmd_and_start_io(struct ctlr_info *h,
                set_performant_mode(h, c);
        }
        dial_down_lockup_detection_during_fw_flash(h, c);
-       spin_lock_irqsave(&h->lock, flags);
-       addQ(&h->reqQ, c);
-       h->Qdepth++;
-       start_io(h, &flags);
-       spin_unlock_irqrestore(&h->lock, flags);
-}
-
-static inline void removeQ(struct CommandList *c)
-{
-       if (WARN_ON(list_empty(&c->list)))
-               return;
-       list_del_init(&c->list);
+       atomic_inc(&h->commands_outstanding);
+       h->access.submit_command(h, c);
 }
 
 static inline int is_hba_lunid(unsigned char scsi3addr[])
@@ -919,7 +900,7 @@ static int hpsa_scsi_add_entry(struct ctlr_info *h, int hostno,
 
        /* If this device a non-zero lun of a multi-lun device
         * byte 4 of the 8-byte LUN addr will contain the logical
-        * unit no, zero otherise.
+        * unit no, zero otherwise.
         */
        if (device->scsi3addr[4] == 0) {
                /* This is not a non-zero lun of a multi-lun device */
@@ -1478,13 +1459,17 @@ static int hpsa_allocate_sg_chain_blocks(struct ctlr_info *h)
 
        h->cmd_sg_list = kzalloc(sizeof(*h->cmd_sg_list) * h->nr_cmds,
                                GFP_KERNEL);
-       if (!h->cmd_sg_list)
+       if (!h->cmd_sg_list) {
+               dev_err(&h->pdev->dev, "Failed to allocate SG list\n");
                return -ENOMEM;
+       }
        for (i = 0; i < h->nr_cmds; i++) {
                h->cmd_sg_list[i] = kmalloc(sizeof(*h->cmd_sg_list[i]) *
                                                h->chainsize, GFP_KERNEL);
-               if (!h->cmd_sg_list[i])
+               if (!h->cmd_sg_list[i]) {
+                       dev_err(&h->pdev->dev, "Failed to allocate cmd SG\n");
                        goto clean;
+               }
        }
        return 0;
 
@@ -1504,7 +1489,7 @@ static int hpsa_map_sg_chain_block(struct ctlr_info *h,
        chain_block = h->cmd_sg_list[c->cmdindex];
        chain_sg->Ext = cpu_to_le32(HPSA_SG_CHAIN);
        chain_len = sizeof(*chain_sg) *
-               (c->Header.SGTotal - h->max_cmd_sg_entries);
+               (le16_to_cpu(c->Header.SGTotal) - h->max_cmd_sg_entries);
        chain_sg->Len = cpu_to_le32(chain_len);
        temp64 = pci_map_single(h->pdev, chain_block, chain_len,
                                PCI_DMA_TODEVICE);
@@ -1635,7 +1620,6 @@ static void process_ioaccel2_completion(struct ctlr_info *h,
                struct hpsa_scsi_dev_t *dev)
 {
        struct io_accel2_cmd *c2 = &h->ioaccel2_cmd_pool[c->cmdindex];
-       int raid_retry = 0;
 
        /* check for good status */
        if (likely(c2->error_data.serv_response == 0 &&
@@ -1652,26 +1636,22 @@ static void process_ioaccel2_completion(struct ctlr_info *h,
        if (is_logical_dev_addr_mode(dev->scsi3addr) &&
                c2->error_data.serv_response ==
                        IOACCEL2_SERV_RESPONSE_FAILURE) {
-               dev->offload_enabled = 0;
-               h->drv_req_rescan = 1;  /* schedule controller for a rescan */
-               cmd->result = DID_SOFT_ERROR << 16;
-               cmd_free(h, c);
-               cmd->scsi_done(cmd);
-               return;
-       }
-       raid_retry = handle_ioaccel_mode2_error(h, c, cmd, c2);
-       /* If error found, disable Smart Path, schedule a rescan,
-        * and force a retry on the standard path.
-        */
-       if (raid_retry) {
-               dev_warn(&h->pdev->dev, "%s: Retrying on standard path.\n",
-                       "HP SSD Smart Path");
-               dev->offload_enabled = 0; /* Disable Smart Path */
-               h->drv_req_rescan = 1;    /* schedule controller rescan */
-               cmd->result = DID_SOFT_ERROR << 16;
+               if (c2->error_data.status ==
+                       IOACCEL2_STATUS_SR_IOACCEL_DISABLED)
+                       dev->offload_enabled = 0;
+               goto retry_cmd;
        }
+
+       if (handle_ioaccel_mode2_error(h, c, cmd, c2))
+               goto retry_cmd;
+
        cmd_free(h, c);
        cmd->scsi_done(cmd);
+       return;
+
+retry_cmd:
+       INIT_WORK(&c->work, hpsa_command_resubmit_worker);
+       queue_work_on(raw_smp_processor_id(), h->resubmit_wq, &c->work);
 }
 
 static void complete_scsi_command(struct CommandList *cp)
@@ -1693,7 +1673,7 @@ static void complete_scsi_command(struct CommandList *cp)
 
        scsi_dma_unmap(cmd); /* undo the DMA mappings */
        if ((cp->cmd_type == CMD_SCSI) &&
-               (cp->Header.SGTotal > h->max_cmd_sg_entries))
+               (le16_to_cpu(cp->Header.SGTotal) > h->max_cmd_sg_entries))
                hpsa_unmap_sg_chain_block(h, cp);
 
        cmd->result = (DID_OK << 16);           /* host byte */
@@ -1726,8 +1706,10 @@ static void complete_scsi_command(struct CommandList *cp)
         */
        if (cp->cmd_type == CMD_IOACCEL1) {
                struct io_accel1_cmd *c = &h->ioaccel_cmd_pool[cp->cmdindex];
-               cp->Header.SGList = cp->Header.SGTotal = scsi_sg_count(cmd);
-               cp->Request.CDBLen = c->io_flags & IOACCEL1_IOFLAGS_CDBLEN_MASK;
+               cp->Header.SGList = scsi_sg_count(cmd);
+               cp->Header.SGTotal = cpu_to_le16(cp->Header.SGList);
+               cp->Request.CDBLen = le16_to_cpu(c->io_flags) &
+                       IOACCEL1_IOFLAGS_CDBLEN_MASK;
                cp->Header.tag = c->tag;
                memcpy(cp->Header.LUN.LunAddrBytes, c->CISS_LUN, 8);
                memcpy(cp->Request.CDB, c->CDB, cp->Request.CDBLen);
@@ -1739,9 +1721,9 @@ static void complete_scsi_command(struct CommandList *cp)
                if (is_logical_dev_addr_mode(dev->scsi3addr)) {
                        if (ei->CommandStatus == CMD_IOACCEL_DISABLED)
                                dev->offload_enabled = 0;
-                       cmd->result = DID_SOFT_ERROR << 16;
-                       cmd_free(h, cp);
-                       cmd->scsi_done(cmd);
+                       INIT_WORK(&cp->work, hpsa_command_resubmit_worker);
+                       queue_work_on(raw_smp_processor_id(),
+                                       h->resubmit_wq, &cp->work);
                        return;
                }
        }
@@ -2048,10 +2030,10 @@ static int hpsa_scsi_do_inquiry(struct ctlr_info *h, unsigned char *scsi3addr,
        struct CommandList *c;
        struct ErrorInfo *ei;
 
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
 
-       if (c == NULL) {                        /* trouble... */
-               dev_warn(&h->pdev->dev, "cmd_special_alloc returned NULL!\n");
+       if (c == NULL) {
+               dev_warn(&h->pdev->dev, "cmd_alloc returned NULL!\n");
                return -ENOMEM;
        }
 
@@ -2067,7 +2049,7 @@ static int hpsa_scsi_do_inquiry(struct ctlr_info *h, unsigned char *scsi3addr,
                rc = -1;
        }
 out:
-       cmd_special_free(h, c);
+       cmd_free(h, c);
        return rc;
 }
 
@@ -2079,10 +2061,9 @@ static int hpsa_bmic_ctrl_mode_sense(struct ctlr_info *h,
        struct CommandList *c;
        struct ErrorInfo *ei;
 
-       c = cmd_special_alloc(h);
-
+       c = cmd_alloc(h);
        if (c == NULL) {                        /* trouble... */
-               dev_warn(&h->pdev->dev, "cmd_special_alloc returned NULL!\n");
+               dev_warn(&h->pdev->dev, "cmd_alloc returned NULL!\n");
                return -ENOMEM;
        }
 
@@ -2098,7 +2079,7 @@ static int hpsa_bmic_ctrl_mode_sense(struct ctlr_info *h,
                rc = -1;
        }
 out:
-       cmd_special_free(h, c);
+       cmd_free(h, c);
        return rc;
        }
 
@@ -2109,10 +2090,10 @@ static int hpsa_send_reset(struct ctlr_info *h, unsigned char *scsi3addr,
        struct CommandList *c;
        struct ErrorInfo *ei;
 
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
 
        if (c == NULL) {                        /* trouble... */
-               dev_warn(&h->pdev->dev, "cmd_special_alloc returned NULL!\n");
+               dev_warn(&h->pdev->dev, "cmd_alloc returned NULL!\n");
                return -ENOMEM;
        }
 
@@ -2128,7 +2109,7 @@ static int hpsa_send_reset(struct ctlr_info *h, unsigned char *scsi3addr,
                hpsa_scsi_interpret_error(h, c);
                rc = -1;
        }
-       cmd_special_free(h, c);
+       cmd_free(h, c);
        return rc;
 }
 
@@ -2191,15 +2172,13 @@ static void hpsa_debug_map_buff(struct ctlr_info *h, int rc,
                        le16_to_cpu(map_buff->row_cnt));
        dev_info(&h->pdev->dev, "layout_map_count = %u\n",
                        le16_to_cpu(map_buff->layout_map_count));
-       dev_info(&h->pdev->dev, "flags = %u\n",
+       dev_info(&h->pdev->dev, "flags = 0x%x\n",
                        le16_to_cpu(map_buff->flags));
-       if (map_buff->flags & RAID_MAP_FLAG_ENCRYPT_ON)
-               dev_info(&h->pdev->dev, "encrypytion = ON\n");
-       else
-               dev_info(&h->pdev->dev, "encrypytion = OFF\n");
+       dev_info(&h->pdev->dev, "encryption = %s\n",
+                       le16_to_cpu(map_buff->flags) &
+                       RAID_MAP_FLAG_ENCRYPT_ON ?  "ON" : "OFF");
        dev_info(&h->pdev->dev, "dekindex = %u\n",
                        le16_to_cpu(map_buff->dekindex));
-
        map_cnt = le16_to_cpu(map_buff->layout_map_count);
        for (map = 0; map < map_cnt; map++) {
                dev_info(&h->pdev->dev, "Map%u:\n", map);
@@ -2238,26 +2217,26 @@ static int hpsa_get_raid_map(struct ctlr_info *h,
        struct CommandList *c;
        struct ErrorInfo *ei;
 
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
        if (c == NULL) {
-               dev_warn(&h->pdev->dev, "cmd_special_alloc returned NULL!\n");
+               dev_warn(&h->pdev->dev, "cmd_alloc returned NULL!\n");
                return -ENOMEM;
        }
        if (fill_cmd(c, HPSA_GET_RAID_MAP, h, &this_device->raid_map,
                        sizeof(this_device->raid_map), 0,
                        scsi3addr, TYPE_CMD)) {
                dev_warn(&h->pdev->dev, "Out of memory in hpsa_get_raid_map()\n");
-               cmd_special_free(h, c);
+               cmd_free(h, c);
                return -ENOMEM;
        }
        hpsa_scsi_do_simple_cmd_with_retry(h, c, PCI_DMA_FROMDEVICE);
        ei = c->err_info;
        if (ei->CommandStatus != 0 && ei->CommandStatus != CMD_DATA_UNDERRUN) {
                hpsa_scsi_interpret_error(h, c);
-               cmd_special_free(h, c);
+               cmd_free(h, c);
                return -1;
        }
-       cmd_special_free(h, c);
+       cmd_free(h, c);
 
        /* @todo in the future, dynamically allocate RAID map memory */
        if (le32_to_cpu(this_device->raid_map.structure_size) >
@@ -2377,9 +2356,9 @@ static int hpsa_scsi_do_report_luns(struct ctlr_info *h, int logical,
        unsigned char scsi3addr[8];
        struct ErrorInfo *ei;
 
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
        if (c == NULL) {                        /* trouble... */
-               dev_err(&h->pdev->dev, "cmd_special_alloc returned NULL!\n");
+               dev_err(&h->pdev->dev, "cmd_alloc returned NULL!\n");
                return -1;
        }
        /* address the controller */
@@ -2407,7 +2386,7 @@ static int hpsa_scsi_do_report_luns(struct ctlr_info *h, int logical,
                }
        }
 out:
-       cmd_special_free(h, c);
+       cmd_free(h, c);
        return rc;
 }
 
@@ -2741,8 +2720,8 @@ static int hpsa_get_pdisk_of_ioaccel2(struct ctlr_info *h,
        struct scsi_cmnd *scmd; /* scsi command within request being aborted */
        struct hpsa_scsi_dev_t *d; /* device of request being aborted */
        struct io_accel2_cmd *c2a; /* ioaccel2 command to abort */
-       u32 it_nexus;           /* 4 byte device handle for the ioaccel2 cmd */
-       u32 scsi_nexus;         /* 4 byte device handle for the ioaccel2 cmd */
+       __le32 it_nexus;        /* 4 byte device handle for the ioaccel2 cmd */
+       __le32 scsi_nexus;      /* 4 byte device handle for the ioaccel2 cmd */
 
        if (ioaccel2_cmd_to_abort->cmd_type != CMD_IOACCEL2)
                return 0; /* no match */
@@ -2761,8 +2740,8 @@ static int hpsa_get_pdisk_of_ioaccel2(struct ctlr_info *h,
                return 0; /* no match */
 
        it_nexus = cpu_to_le32(d->ioaccel_handle);
-       scsi_nexus = cpu_to_le32(c2a->scsi_nexus);
-       find = c2a->scsi_nexus;
+       scsi_nexus = c2a->scsi_nexus;
+       find = le32_to_cpu(c2a->scsi_nexus);
 
        if (h->raid_offload_debug > 0)
                dev_info(&h->pdev->dev,
@@ -3105,7 +3084,8 @@ out:
        kfree(logdev_list);
 }
 
-/* hpsa_scatter_gather takes a struct scsi_cmnd, (cmd), and does the pci
+/*
+ * hpsa_scatter_gather takes a struct scsi_cmnd, (cmd), and does the pci
  * dma mapping  and fills in the scatter gather entries of the
  * hpsa command, cp.
  */
@@ -3163,7 +3143,7 @@ static int hpsa_scatter_gather(struct ctlr_info *h,
 sglist_finished:
 
        cp->Header.SGList = (u8) use_sg;   /* no. SGs contig in this cmd */
-       cp->Header.SGTotal = cpu_to_le16(use_sg); /* total sgs in this cmd list */
+       cp->Header.SGTotal = cpu_to_le16(use_sg); /* total sgs in cmd list */
        return 0;
 }
 
@@ -3284,11 +3264,11 @@ static int hpsa_scsi_ioaccel1_queue_command(struct ctlr_info *h,
 
        c->Header.SGList = use_sg;
        /* Fill out the command structure to submit */
-       cp->dev_handle = ioaccel_handle & 0xFFFF;
-       cp->transfer_len = total_len;
-       cp->io_flags = IOACCEL1_IOFLAGS_IO_REQ |
-                       (cdb_len & IOACCEL1_IOFLAGS_CDBLEN_MASK);
-       cp->control = control;
+       cp->dev_handle = cpu_to_le16(ioaccel_handle & 0xFFFF);
+       cp->transfer_len = cpu_to_le32(total_len);
+       cp->io_flags = cpu_to_le16(IOACCEL1_IOFLAGS_IO_REQ |
+                       (cdb_len & IOACCEL1_IOFLAGS_CDBLEN_MASK));
+       cp->control = cpu_to_le32(control);
        memcpy(cp->CDB, cdb, cdb_len);
        memcpy(cp->CISS_LUN, scsi3addr, 8);
        /* Tag was already set at init time. */
@@ -3324,7 +3304,7 @@ static void set_encrypt_ioaccel2(struct ctlr_info *h,
        BUG_ON(!(dev->offload_config && dev->offload_enabled));
 
        /* Are we doing encryption on this device */
-       if (!(map->flags & RAID_MAP_FLAG_ENCRYPT_ON))
+       if (!(le16_to_cpu(map->flags) & RAID_MAP_FLAG_ENCRYPT_ON))
                return;
        /* Set the data encryption key index. */
        cp->dekindex = map->dekindex;
@@ -3340,96 +3320,33 @@ static void set_encrypt_ioaccel2(struct ctlr_info *h,
        /* Required? 6-byte cdbs eliminated by fixup_ioaccel_cdb */
        case WRITE_6:
        case READ_6:
-               if (map->volume_blk_size == 512) {
-                       cp->tweak_lower =
-                               (((u32) cmd->cmnd[2]) << 8) |
-                                       cmd->cmnd[3];
-                       cp->tweak_upper = 0;
-               } else {
-                       first_block =
-                               (((u64) cmd->cmnd[2]) << 8) |
-                                       cmd->cmnd[3];
-                       first_block = (first_block * map->volume_blk_size)/512;
-                       cp->tweak_lower = (u32)first_block;
-                       cp->tweak_upper = (u32)(first_block >> 32);
-               }
+               first_block = get_unaligned_be16(&cmd->cmnd[2]);
                break;
        case WRITE_10:
        case READ_10:
-               if (map->volume_blk_size == 512) {
-                       cp->tweak_lower =
-                               (((u32) cmd->cmnd[2]) << 24) |
-                               (((u32) cmd->cmnd[3]) << 16) |
-                               (((u32) cmd->cmnd[4]) << 8) |
-                                       cmd->cmnd[5];
-                       cp->tweak_upper = 0;
-               } else {
-                       first_block =
-                               (((u64) cmd->cmnd[2]) << 24) |
-                               (((u64) cmd->cmnd[3]) << 16) |
-                               (((u64) cmd->cmnd[4]) << 8) |
-                                       cmd->cmnd[5];
-                       first_block = (first_block * map->volume_blk_size)/512;
-                       cp->tweak_lower = (u32)first_block;
-                       cp->tweak_upper = (u32)(first_block >> 32);
-               }
-               break;
        /* Required? 12-byte cdbs eliminated by fixup_ioaccel_cdb */
        case WRITE_12:
        case READ_12:
-               if (map->volume_blk_size == 512) {
-                       cp->tweak_lower =
-                               (((u32) cmd->cmnd[2]) << 24) |
-                               (((u32) cmd->cmnd[3]) << 16) |
-                               (((u32) cmd->cmnd[4]) << 8) |
-                                       cmd->cmnd[5];
-                       cp->tweak_upper = 0;
-               } else {
-                       first_block =
-                               (((u64) cmd->cmnd[2]) << 24) |
-                               (((u64) cmd->cmnd[3]) << 16) |
-                               (((u64) cmd->cmnd[4]) << 8) |
-                                       cmd->cmnd[5];
-                       first_block = (first_block * map->volume_blk_size)/512;
-                       cp->tweak_lower = (u32)first_block;
-                       cp->tweak_upper = (u32)(first_block >> 32);
-               }
+               first_block = get_unaligned_be32(&cmd->cmnd[2]);
                break;
        case WRITE_16:
        case READ_16:
-               if (map->volume_blk_size == 512) {
-                       cp->tweak_lower =
-                               (((u32) cmd->cmnd[6]) << 24) |
-                               (((u32) cmd->cmnd[7]) << 16) |
-                               (((u32) cmd->cmnd[8]) << 8) |
-                                       cmd->cmnd[9];
-                       cp->tweak_upper =
-                               (((u32) cmd->cmnd[2]) << 24) |
-                               (((u32) cmd->cmnd[3]) << 16) |
-                               (((u32) cmd->cmnd[4]) << 8) |
-                                       cmd->cmnd[5];
-               } else {
-                       first_block =
-                               (((u64) cmd->cmnd[2]) << 56) |
-                               (((u64) cmd->cmnd[3]) << 48) |
-                               (((u64) cmd->cmnd[4]) << 40) |
-                               (((u64) cmd->cmnd[5]) << 32) |
-                               (((u64) cmd->cmnd[6]) << 24) |
-                               (((u64) cmd->cmnd[7]) << 16) |
-                               (((u64) cmd->cmnd[8]) << 8) |
-                                       cmd->cmnd[9];
-                       first_block = (first_block * map->volume_blk_size)/512;
-                       cp->tweak_lower = (u32)first_block;
-                       cp->tweak_upper = (u32)(first_block >> 32);
-               }
+               first_block = get_unaligned_be64(&cmd->cmnd[2]);
                break;
        default:
                dev_err(&h->pdev->dev,
-                       "ERROR: %s: IOACCEL request CDB size not supported for encryption\n",
-                       __func__);
+                       "ERROR: %s: size (0x%x) not supported for encryption\n",
+                       __func__, cmd->cmnd[0]);
                BUG();
                break;
        }
+
+       if (le32_to_cpu(map->volume_blk_size) != 512)
+               first_block = first_block *
+                               le32_to_cpu(map->volume_blk_size)/512;
+
+       cp->tweak_lower = cpu_to_le32(first_block);
+       cp->tweak_upper = cpu_to_le32(first_block >> 32);
 }
 
 static int hpsa_scsi_ioaccel2_queue_command(struct ctlr_info *h,
@@ -3506,9 +3423,8 @@ static int hpsa_scsi_ioaccel2_queue_command(struct ctlr_info *h,
        /* Set encryption parameters, if necessary */
        set_encrypt_ioaccel2(h, c, cp);
 
-       cp->scsi_nexus = ioaccel_handle;
-       cp->Tag = (c->cmdindex << DIRECT_LOOKUP_SHIFT) |
-                               DIRECT_LOOKUP_BIT;
+       cp->scsi_nexus = cpu_to_le32(ioaccel_handle);
+       cp->Tag = cpu_to_le32(c->cmdindex << DIRECT_LOOKUP_SHIFT);
        memcpy(cp->cdb, cdb, sizeof(cp->cdb));
 
        /* fill in sg elements */
@@ -3543,21 +3459,22 @@ static void raid_map_helper(struct raid_map_data *map,
 {
        if (offload_to_mirror == 0)  {
                /* use physical disk in the first mirrored group. */
-               *map_index %= map->data_disks_per_row;
+               *map_index %= le16_to_cpu(map->data_disks_per_row);
                return;
        }
        do {
                /* determine mirror group that *map_index indicates */
-               *current_group = *map_index / map->data_disks_per_row;
+               *current_group = *map_index /
+                       le16_to_cpu(map->data_disks_per_row);
                if (offload_to_mirror == *current_group)
                        continue;
-               if (*current_group < (map->layout_map_count - 1)) {
+               if (*current_group < le16_to_cpu(map->layout_map_count) - 1) {
                        /* select map index from next group */
-                       *map_index += map->data_disks_per_row;
+                       *map_index += le16_to_cpu(map->data_disks_per_row);
                        (*current_group)++;
                } else {
                        /* select map index from first group */
-                       *map_index %= map->data_disks_per_row;
+                       *map_index %= le16_to_cpu(map->data_disks_per_row);
                        *current_group = 0;
                }
        } while (offload_to_mirror != *current_group);
@@ -3595,6 +3512,7 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
        u32 disk_block_cnt;
        u8 cdb[16];
        u8 cdb_len;
+       u16 strip_size;
 #if BITS_PER_LONG == 32
        u64 tmpdiv;
 #endif
@@ -3668,11 +3586,14 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
                return IO_ACCEL_INELIGIBLE;
 
        /* check for invalid block or wraparound */
-       if (last_block >= map->volume_blk_cnt || last_block < first_block)
+       if (last_block >= le64_to_cpu(map->volume_blk_cnt) ||
+               last_block < first_block)
                return IO_ACCEL_INELIGIBLE;
 
        /* calculate stripe information for the request */
-       blocks_per_row = map->data_disks_per_row * map->strip_size;
+       blocks_per_row = le16_to_cpu(map->data_disks_per_row) *
+                               le16_to_cpu(map->strip_size);
+       strip_size = le16_to_cpu(map->strip_size);
 #if BITS_PER_LONG == 32
        tmpdiv = first_block;
        (void) do_div(tmpdiv, blocks_per_row);
@@ -3683,18 +3604,18 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
        first_row_offset = (u32) (first_block - (first_row * blocks_per_row));
        last_row_offset = (u32) (last_block - (last_row * blocks_per_row));
        tmpdiv = first_row_offset;
-       (void) do_div(tmpdiv,  map->strip_size);
+       (void) do_div(tmpdiv, strip_size);
        first_column = tmpdiv;
        tmpdiv = last_row_offset;
-       (void) do_div(tmpdiv, map->strip_size);
+       (void) do_div(tmpdiv, strip_size);
        last_column = tmpdiv;
 #else
        first_row = first_block / blocks_per_row;
        last_row = last_block / blocks_per_row;
        first_row_offset = (u32) (first_block - (first_row * blocks_per_row));
        last_row_offset = (u32) (last_block - (last_row * blocks_per_row));
-       first_column = first_row_offset / map->strip_size;
-       last_column = last_row_offset / map->strip_size;
+       first_column = first_row_offset / strip_size;
+       last_column = last_row_offset / strip_size;
 #endif
 
        /* if this isn't a single row/column then give to the controller */
@@ -3702,10 +3623,10 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
                return IO_ACCEL_INELIGIBLE;
 
        /* proceeding with driver mapping */
-       total_disks_per_row = map->data_disks_per_row +
-                               map->metadata_disks_per_row;
+       total_disks_per_row = le16_to_cpu(map->data_disks_per_row) +
+                               le16_to_cpu(map->metadata_disks_per_row);
        map_row = ((u32)(first_row >> map->parity_rotation_shift)) %
-                               map->row_cnt;
+                               le16_to_cpu(map->row_cnt);
        map_index = (map_row * total_disks_per_row) + first_column;
 
        switch (dev->raid_level) {
@@ -3716,23 +3637,24 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
                 * (2-drive R1 and R10 with even # of drives.)
                 * Appropriate for SSDs, not optimal for HDDs
                 */
-               BUG_ON(map->layout_map_count != 2);
+               BUG_ON(le16_to_cpu(map->layout_map_count) != 2);
                if (dev->offload_to_mirror)
-                       map_index += map->data_disks_per_row;
+                       map_index += le16_to_cpu(map->data_disks_per_row);
                dev->offload_to_mirror = !dev->offload_to_mirror;
                break;
        case HPSA_RAID_ADM:
                /* Handles N-way mirrors  (R1-ADM)
                 * and R10 with # of drives divisible by 3.)
                 */
-               BUG_ON(map->layout_map_count != 3);
+               BUG_ON(le16_to_cpu(map->layout_map_count) != 3);
 
                offload_to_mirror = dev->offload_to_mirror;
                raid_map_helper(map, offload_to_mirror,
                                &map_index, &current_group);
                /* set mirror group to use next time */
                offload_to_mirror =
-                       (offload_to_mirror >= map->layout_map_count - 1)
+                       (offload_to_mirror >=
+                       le16_to_cpu(map->layout_map_count) - 1)
                        ? 0 : offload_to_mirror + 1;
                dev->offload_to_mirror = offload_to_mirror;
                /* Avoid direct use of dev->offload_to_mirror within this
@@ -3742,14 +3664,16 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
                break;
        case HPSA_RAID_5:
        case HPSA_RAID_6:
-               if (map->layout_map_count <= 1)
+               if (le16_to_cpu(map->layout_map_count) <= 1)
                        break;
 
                /* Verify first and last block are in same RAID group */
                r5or6_blocks_per_row =
-                       map->strip_size * map->data_disks_per_row;
+                       le16_to_cpu(map->strip_size) *
+                       le16_to_cpu(map->data_disks_per_row);
                BUG_ON(r5or6_blocks_per_row == 0);
-               stripesize = r5or6_blocks_per_row * map->layout_map_count;
+               stripesize = r5or6_blocks_per_row *
+                       le16_to_cpu(map->layout_map_count);
 #if BITS_PER_LONG == 32
                tmpdiv = first_block;
                first_group = do_div(tmpdiv, stripesize);
@@ -3812,19 +3736,19 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
                                                r5or6_blocks_per_row);
 
                first_column = r5or6_first_column =
-                       r5or6_first_row_offset / map->strip_size;
+                       r5or6_first_row_offset / le16_to_cpu(map->strip_size);
                r5or6_last_column =
-                       r5or6_last_row_offset / map->strip_size;
+                       r5or6_last_row_offset / le16_to_cpu(map->strip_size);
 #endif
                if (r5or6_first_column != r5or6_last_column)
                        return IO_ACCEL_INELIGIBLE;
 
                /* Request is eligible */
                map_row = ((u32)(first_row >> map->parity_rotation_shift)) %
-                       map->row_cnt;
+                       le16_to_cpu(map->row_cnt);
 
                map_index = (first_group *
-                       (map->row_cnt * total_disks_per_row)) +
+                       (le16_to_cpu(map->row_cnt) * total_disks_per_row)) +
                        (map_row * total_disks_per_row) + first_column;
                break;
        default:
@@ -3832,8 +3756,10 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
        }
 
        disk_handle = dd[map_index].ioaccel_handle;
-       disk_block = map->disk_starting_blk + (first_row * map->strip_size) +
-                       (first_row_offset - (first_column * map->strip_size));
+       disk_block = le64_to_cpu(map->disk_starting_blk) +
+                       first_row * le16_to_cpu(map->strip_size) +
+                       (first_row_offset - first_column *
+                       le16_to_cpu(map->strip_size));
        disk_block_cnt = block_cnt;
 
        /* handle differing logical/physical block sizes */
@@ -3879,75 +3805,17 @@ static int hpsa_scsi_ioaccel_raid_map(struct ctlr_info *h,
                                                dev->scsi3addr);
 }
 
-/*
- * Running in struct Scsi_Host->host_lock less mode using LLD internal
- * struct ctlr_info *h->lock w/ spin_lock_irqsave() protection.
- */
-static int hpsa_scsi_queue_command(struct Scsi_Host *sh, struct scsi_cmnd *cmd)
+/* Submit commands down the "normal" RAID stack path */
+static int hpsa_ciss_submit(struct ctlr_info *h,
+       struct CommandList *c, struct scsi_cmnd *cmd,
+       unsigned char scsi3addr[])
 {
-       struct ctlr_info *h;
-       struct hpsa_scsi_dev_t *dev;
-       unsigned char scsi3addr[8];
-       struct CommandList *c;
-       int rc = 0;
-
-       /* Get the ptr to our adapter structure out of cmd->host. */
-       h = sdev_to_hba(cmd->device);
-       dev = cmd->device->hostdata;
-       if (!dev) {
-               cmd->result = DID_NO_CONNECT << 16;
-               cmd->scsi_done(cmd);
-               return 0;
-       }
-       memcpy(scsi3addr, dev->scsi3addr, sizeof(scsi3addr));
-
-       if (unlikely(lockup_detected(h))) {
-               cmd->result = DID_ERROR << 16;
-               cmd->scsi_done(cmd);
-               return 0;
-       }
-       c = cmd_alloc(h);
-       if (c == NULL) {                        /* trouble... */
-               dev_err(&h->pdev->dev, "cmd_alloc returned NULL!\n");
-               return SCSI_MLQUEUE_HOST_BUSY;
-       }
-
-       /* Fill in the command list header */
-       /* save c in case we have to abort it  */
        cmd->host_scribble = (unsigned char *) c;
-
        c->cmd_type = CMD_SCSI;
        c->scsi_cmd = cmd;
-
-       /* Call alternate submit routine for I/O accelerated commands.
-        * Retries always go down the normal I/O path.
-        */
-       if (likely(cmd->retries == 0 &&
-               cmd->request->cmd_type == REQ_TYPE_FS &&
-               h->acciopath_status)) {
-               if (dev->offload_enabled) {
-                       rc = hpsa_scsi_ioaccel_raid_map(h, c);
-                       if (rc == 0)
-                               return 0; /* Sent on ioaccel path */
-                       if (rc < 0) {   /* scsi_dma_map failed. */
-                               cmd_free(h, c);
-                               return SCSI_MLQUEUE_HOST_BUSY;
-                       }
-               } else if (dev->ioaccel_handle) {
-                       rc = hpsa_scsi_ioaccel_direct_map(h, c);
-                       if (rc == 0)
-                               return 0; /* Sent on direct map path */
-                       if (rc < 0) {   /* scsi_dma_map failed. */
-                               cmd_free(h, c);
-                               return SCSI_MLQUEUE_HOST_BUSY;
-                       }
-               }
-       }
-
        c->Header.ReplyQueue = 0;  /* unused in simple mode */
        memcpy(&c->Header.LUN.LunAddrBytes[0], &scsi3addr[0], 8);
-       c->Header.tag = cpu_to_le64((c->cmdindex << DIRECT_LOOKUP_SHIFT) |
-                                       DIRECT_LOOKUP_BIT);
+       c->Header.tag = cpu_to_le64((c->cmdindex << DIRECT_LOOKUP_SHIFT));
 
        /* Fill in the request block... */
 
@@ -4003,6 +3871,93 @@ static int hpsa_scsi_queue_command(struct Scsi_Host *sh, struct scsi_cmnd *cmd)
        return 0;
 }
 
+static void hpsa_command_resubmit_worker(struct work_struct *work)
+{
+       struct scsi_cmnd *cmd;
+       struct hpsa_scsi_dev_t *dev;
+       struct CommandList *c =
+                       container_of(work, struct CommandList, work);
+
+       cmd = c->scsi_cmd;
+       dev = cmd->device->hostdata;
+       if (!dev) {
+               cmd->result = DID_NO_CONNECT << 16;
+               cmd->scsi_done(cmd);
+               return;
+       }
+       if (hpsa_ciss_submit(c->h, c, cmd, dev->scsi3addr)) {
+               /*
+                * If we get here, it means dma mapping failed. Try
+                * again via scsi mid layer, which will then get
+                * SCSI_MLQUEUE_HOST_BUSY.
+                */
+               cmd->result = DID_IMM_RETRY << 16;
+               cmd->scsi_done(cmd);
+       }
+}
+
+/* Running in struct Scsi_Host->host_lock less mode */
+static int hpsa_scsi_queue_command(struct Scsi_Host *sh, struct scsi_cmnd *cmd)
+{
+       struct ctlr_info *h;
+       struct hpsa_scsi_dev_t *dev;
+       unsigned char scsi3addr[8];
+       struct CommandList *c;
+       int rc = 0;
+
+       /* Get the ptr to our adapter structure out of cmd->host. */
+       h = sdev_to_hba(cmd->device);
+       dev = cmd->device->hostdata;
+       if (!dev) {
+               cmd->result = DID_NO_CONNECT << 16;
+               cmd->scsi_done(cmd);
+               return 0;
+       }
+       memcpy(scsi3addr, dev->scsi3addr, sizeof(scsi3addr));
+
+       if (unlikely(lockup_detected(h))) {
+               cmd->result = DID_ERROR << 16;
+               cmd->scsi_done(cmd);
+               return 0;
+       }
+       c = cmd_alloc(h);
+       if (c == NULL) {                        /* trouble... */
+               dev_err(&h->pdev->dev, "cmd_alloc returned NULL!\n");
+               return SCSI_MLQUEUE_HOST_BUSY;
+       }
+
+       /* Call alternate submit routine for I/O accelerated commands.
+        * Retries always go down the normal I/O path.
+        */
+       if (likely(cmd->retries == 0 &&
+               cmd->request->cmd_type == REQ_TYPE_FS &&
+               h->acciopath_status)) {
+
+               cmd->host_scribble = (unsigned char *) c;
+               c->cmd_type = CMD_SCSI;
+               c->scsi_cmd = cmd;
+
+               if (dev->offload_enabled) {
+                       rc = hpsa_scsi_ioaccel_raid_map(h, c);
+                       if (rc == 0)
+                               return 0; /* Sent on ioaccel path */
+                       if (rc < 0) {   /* scsi_dma_map failed. */
+                               cmd_free(h, c);
+                               return SCSI_MLQUEUE_HOST_BUSY;
+                       }
+               } else if (dev->ioaccel_handle) {
+                       rc = hpsa_scsi_ioaccel_direct_map(h, c);
+                       if (rc == 0)
+                               return 0; /* Sent on direct map path */
+                       if (rc < 0) {   /* scsi_dma_map failed. */
+                               cmd_free(h, c);
+                               return SCSI_MLQUEUE_HOST_BUSY;
+                       }
+               }
+       }
+       return hpsa_ciss_submit(h, c, cmd, scsi3addr);
+}
+
 static int do_not_scan_if_controller_locked_up(struct ctlr_info *h)
 {
        unsigned long flags;
@@ -4059,6 +4014,19 @@ static void hpsa_scan_start(struct Scsi_Host *sh)
        spin_unlock_irqrestore(&h->scan_lock, flags);
 }
 
+static int hpsa_change_queue_depth(struct scsi_device *sdev, int qdepth)
+{
+       struct ctlr_info *h = sdev_to_hba(sdev);
+
+       if (qdepth < 1)
+               qdepth = 1;
+       else
+               if (qdepth > h->nr_cmds)
+                       qdepth = h->nr_cmds;
+       scsi_change_queue_depth(sdev, qdepth);
+       return sdev->queue_depth;
+}
+
 static int hpsa_scan_finished(struct Scsi_Host *sh,
        unsigned long elapsed_time)
 {
@@ -4096,11 +4064,14 @@ static int hpsa_register_scsi(struct ctlr_info *h)
        sh->max_cmd_len = MAX_COMMAND_SIZE;
        sh->max_lun = HPSA_MAX_LUN;
        sh->max_id = HPSA_MAX_LUN;
-       sh->can_queue = h->nr_cmds;
+       sh->can_queue = h->nr_cmds -
+                       HPSA_CMDS_RESERVED_FOR_ABORTS -
+                       HPSA_CMDS_RESERVED_FOR_DRIVER -
+                       HPSA_MAX_CONCURRENT_PASSTHRUS;
        if (h->hba_mode_enabled)
                sh->cmd_per_lun = 7;
        else
-               sh->cmd_per_lun = h->nr_cmds;
+               sh->cmd_per_lun = sh->can_queue;
        sh->sg_tablesize = h->maxsgentries;
        h->scsi_host = sh;
        sh->hostdata[0] = (unsigned long) h;
@@ -4131,7 +4102,7 @@ static int wait_for_device_to_become_ready(struct ctlr_info *h,
        int waittime = 1; /* seconds */
        struct CommandList *c;
 
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
        if (!c) {
                dev_warn(&h->pdev->dev, "out of memory in "
                        "wait_for_device_to_become_ready.\n");
@@ -4177,7 +4148,7 @@ static int wait_for_device_to_become_ready(struct ctlr_info *h,
        else
                dev_warn(&h->pdev->dev, "device is ready.\n");
 
-       cmd_special_free(h, c);
+       cmd_free(h, c);
        return rc;
 }
 
@@ -4227,13 +4198,15 @@ static void swizzle_abort_tag(u8 *tag)
 }
 
 static void hpsa_get_tag(struct ctlr_info *h,
-       struct CommandList *c, u32 *taglower, u32 *tagupper)
+       struct CommandList *c, __le32 *taglower, __le32 *tagupper)
 {
+       u64 tag;
        if (c->cmd_type == CMD_IOACCEL1) {
                struct io_accel1_cmd *cm1 = (struct io_accel1_cmd *)
                        &h->ioaccel_cmd_pool[c->cmdindex];
-               *tagupper = (u32) (cm1->tag >> 32);
-               *taglower = (u32) (cm1->tag & 0x0ffffffffULL);
+               tag = le64_to_cpu(cm1->tag);
+               *tagupper = cpu_to_le32(tag >> 32);
+               *taglower = cpu_to_le32(tag);
                return;
        }
        if (c->cmd_type == CMD_IOACCEL2) {
@@ -4244,8 +4217,9 @@ static void hpsa_get_tag(struct ctlr_info *h,
                *taglower = cm2->Tag;
                return;
        }
-       *tagupper = (u32) (c->Header.tag >> 32);
-       *taglower = (u32) (c->Header.tag & 0x0ffffffffULL);
+       tag = le64_to_cpu(c->Header.tag);
+       *tagupper = cpu_to_le32(tag >> 32);
+       *taglower = cpu_to_le32(tag);
 }
 
 static int hpsa_send_abort(struct ctlr_info *h, unsigned char *scsi3addr,
@@ -4254,11 +4228,11 @@ static int hpsa_send_abort(struct ctlr_info *h, unsigned char *scsi3addr,
        int rc = IO_OK;
        struct CommandList *c;
        struct ErrorInfo *ei;
-       u32 tagupper, taglower;
+       __le32 tagupper, taglower;
 
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
        if (c == NULL) {        /* trouble... */
-               dev_warn(&h->pdev->dev, "cmd_special_alloc returned NULL!\n");
+               dev_warn(&h->pdev->dev, "cmd_alloc returned NULL!\n");
                return -ENOMEM;
        }
 
@@ -4287,62 +4261,12 @@ static int hpsa_send_abort(struct ctlr_info *h, unsigned char *scsi3addr,
                rc = -1;
                break;
        }
-       cmd_special_free(h, c);
+       cmd_free(h, c);
        dev_dbg(&h->pdev->dev, "%s: Tag:0x%08x:%08x: Finished.\n",
                __func__, tagupper, taglower);
        return rc;
 }
 
-/*
- * hpsa_find_cmd_in_queue
- *
- * Used to determine whether a command (find) is still present
- * in queue_head.   Optionally excludes the last element of queue_head.
- *
- * This is used to avoid unnecessary aborts.  Commands in h->reqQ have
- * not yet been submitted, and so can be aborted by the driver without
- * sending an abort to the hardware.
- *
- * Returns pointer to command if found in queue, NULL otherwise.
- */
-static struct CommandList *hpsa_find_cmd_in_queue(struct ctlr_info *h,
-                       struct scsi_cmnd *find, struct list_head *queue_head)
-{
-       unsigned long flags;
-       struct CommandList *c = NULL;   /* ptr into cmpQ */
-
-       if (!find)
-               return NULL;
-       spin_lock_irqsave(&h->lock, flags);
-       list_for_each_entry(c, queue_head, list) {
-               if (c->scsi_cmd == NULL) /* e.g.: passthru ioctl */
-                       continue;
-               if (c->scsi_cmd == find) {
-                       spin_unlock_irqrestore(&h->lock, flags);
-                       return c;
-               }
-       }
-       spin_unlock_irqrestore(&h->lock, flags);
-       return NULL;
-}
-
-static struct CommandList *hpsa_find_cmd_in_queue_by_tag(struct ctlr_info *h,
-                                       u8 *tag, struct list_head *queue_head)
-{
-       unsigned long flags;
-       struct CommandList *c;
-
-       spin_lock_irqsave(&h->lock, flags);
-       list_for_each_entry(c, queue_head, list) {
-               if (memcmp(&c->Header.tag, tag, 8) != 0)
-                       continue;
-               spin_unlock_irqrestore(&h->lock, flags);
-               return c;
-       }
-       spin_unlock_irqrestore(&h->lock, flags);
-       return NULL;
-}
-
 /* ioaccel2 path firmware cannot handle abort task requests.
  * Change abort requests to physical target reset, and send to the
  * address of the physical disk used for the ioaccel 2 command.
@@ -4429,10 +4353,6 @@ static int hpsa_send_reset_as_abort_ioaccel2(struct ctlr_info *h,
 static int hpsa_send_abort_both_ways(struct ctlr_info *h,
        unsigned char *scsi3addr, struct CommandList *abort)
 {
-       u8 swizzled_tag[8];
-       struct CommandList *c;
-       int rc = 0, rc2 = 0;
-
        /* ioccelerator mode 2 commands should be aborted via the
         * accelerated path, since RAID path is unaware of these commands,
         * but underlying firmware can't handle abort TMF.
@@ -4441,27 +4361,8 @@ static int hpsa_send_abort_both_ways(struct ctlr_info *h,
        if (abort->cmd_type == CMD_IOACCEL2)
                return hpsa_send_reset_as_abort_ioaccel2(h, scsi3addr, abort);
 
-       /* we do not expect to find the swizzled tag in our queue, but
-        * check anyway just to be sure the assumptions which make this
-        * the case haven't become wrong.
-        */
-       memcpy(swizzled_tag, &abort->Request.CDB[4], 8);
-       swizzle_abort_tag(swizzled_tag);
-       c = hpsa_find_cmd_in_queue_by_tag(h, swizzled_tag, &h->cmpQ);
-       if (c != NULL) {
-               dev_warn(&h->pdev->dev, "Unexpectedly found byte-swapped tag in completion queue.\n");
-               return hpsa_send_abort(h, scsi3addr, abort, 0);
-       }
-       rc = hpsa_send_abort(h, scsi3addr, abort, 0);
-
-       /* if the command is still in our queue, we can't conclude that it was
-        * aborted (it might have just completed normally) but in any case
-        * we don't need to try to abort it another way.
-        */
-       c = hpsa_find_cmd_in_queue(h, abort->scsi_cmd, &h->cmpQ);
-       if (c)
-               rc2 = hpsa_send_abort(h, scsi3addr, abort, 1);
-       return rc && rc2;
+       return hpsa_send_abort(h, scsi3addr, abort, 0) &&
+                       hpsa_send_abort(h, scsi3addr, abort, 1);
 }
 
 /* Send an abort for the specified command.
@@ -4475,11 +4376,10 @@ static int hpsa_eh_abort_handler(struct scsi_cmnd *sc)
        struct ctlr_info *h;
        struct hpsa_scsi_dev_t *dev;
        struct CommandList *abort; /* pointer to command to be aborted */
-       struct CommandList *found;
        struct scsi_cmnd *as;   /* ptr to scsi cmd inside aborted command. */
        char msg[256];          /* For debug messaging. */
        int ml = 0;
-       u32 tagupper, taglower;
+       __le32 tagupper, taglower;
 
        /* Find the controller of the command to be aborted */
        h = sdev_to_hba(sc->device);
@@ -4521,28 +4421,6 @@ static int hpsa_eh_abort_handler(struct scsi_cmnd *sc)
        dev_dbg(&h->pdev->dev, "%s\n", msg);
        dev_warn(&h->pdev->dev, "Abort request on C%d:B%d:T%d:L%d\n",
                h->scsi_host->host_no, dev->bus, dev->target, dev->lun);
-
-       /* Search reqQ to See if command is queued but not submitted,
-        * if so, complete the command with aborted status and remove
-        * it from the reqQ.
-        */
-       found = hpsa_find_cmd_in_queue(h, sc, &h->reqQ);
-       if (found) {
-               found->err_info->CommandStatus = CMD_ABORTED;
-               finish_cmd(found);
-               dev_info(&h->pdev->dev, "%s Request SUCCEEDED (driver queue).\n",
-                               msg);
-               return SUCCESS;
-       }
-
-       /* not in reqQ, if also not in cmpQ, must have already completed */
-       found = hpsa_find_cmd_in_queue(h, sc, &h->cmpQ);
-       if (!found)  {
-               dev_dbg(&h->pdev->dev, "%s Request SUCCEEDED (not known to driver).\n",
-                               msg);
-               return SUCCESS;
-       }
-
        /*
         * Command is in flight, or possibly already completed
         * by the firmware (but not to the scsi mid layer) but we can't
@@ -4565,10 +4443,12 @@ static int hpsa_eh_abort_handler(struct scsi_cmnd *sc)
         */
 #define ABORT_COMPLETE_WAIT_SECS 30
        for (i = 0; i < ABORT_COMPLETE_WAIT_SECS * 10; i++) {
-               found = hpsa_find_cmd_in_queue(h, sc, &h->cmpQ);
-               if (!found)
+               if (test_bit(abort->cmdindex & (BITS_PER_LONG - 1),
+                               h->cmd_pool_bits +
+                               (abort->cmdindex / BITS_PER_LONG)))
+                       msleep(100);
+               else
                        return SUCCESS;
-               msleep(100);
        }
        dev_warn(&h->pdev->dev, "%s FAILED. Aborted command has not completed after %d seconds.\n",
                msg, ABORT_COMPLETE_WAIT_SECS);
@@ -4617,8 +4497,8 @@ static struct CommandList *cmd_alloc(struct ctlr_info *h)
 
        c = h->cmd_pool + i;
        memset(c, 0, sizeof(*c));
-       cmd_dma_handle = h->cmd_pool_dhandle
-           + i * sizeof(*c);
+       c->Header.tag = cpu_to_le64((u64) i << DIRECT_LOOKUP_SHIFT);
+       cmd_dma_handle = h->cmd_pool_dhandle + i * sizeof(*c);
        c->err_info = h->errinfo_pool + i;
        memset(c->err_info, 0, sizeof(*c->err_info));
        err_dma_handle = h->errinfo_pool_dhandle
@@ -4626,7 +4506,6 @@ static struct CommandList *cmd_alloc(struct ctlr_info *h)
 
        c->cmdindex = i;
 
-       INIT_LIST_HEAD(&c->list);
        c->busaddr = (u32) cmd_dma_handle;
        temp64.val = (u64) err_dma_handle;
        c->ErrDesc.Addr = cpu_to_le64(err_dma_handle);
@@ -4636,40 +4515,6 @@ static struct CommandList *cmd_alloc(struct ctlr_info *h)
        return c;
 }
 
-/* For operations that can wait for kmalloc to possibly sleep,
- * this routine can be called. Lock need not be held to call
- * cmd_special_alloc. cmd_special_free() is the complement.
- */
-static struct CommandList *cmd_special_alloc(struct ctlr_info *h)
-{
-       struct CommandList *c;
-       dma_addr_t cmd_dma_handle, err_dma_handle;
-
-       c = pci_zalloc_consistent(h->pdev, sizeof(*c), &cmd_dma_handle);
-       if (c == NULL)
-               return NULL;
-
-       c->cmd_type = CMD_SCSI;
-       c->cmdindex = -1;
-
-       c->err_info = pci_zalloc_consistent(h->pdev, sizeof(*c->err_info),
-                                           &err_dma_handle);
-
-       if (c->err_info == NULL) {
-               pci_free_consistent(h->pdev,
-                       sizeof(*c), c, cmd_dma_handle);
-               return NULL;
-       }
-
-       INIT_LIST_HEAD(&c->list);
-       c->busaddr = (u32) cmd_dma_handle;
-       c->ErrDesc.Addr = cpu_to_le64(err_dma_handle);
-       c->ErrDesc.Len = cpu_to_le32(sizeof(*c->err_info));
-
-       c->h = h;
-       return c;
-}
-
 static void cmd_free(struct ctlr_info *h, struct CommandList *c)
 {
        int i;
@@ -4679,15 +4524,6 @@ static void cmd_free(struct ctlr_info *h, struct CommandList *c)
                  h->cmd_pool_bits + (i / BITS_PER_LONG));
 }
 
-static void cmd_special_free(struct ctlr_info *h, struct CommandList *c)
-{
-       pci_free_consistent(h->pdev, sizeof(*c->err_info),
-                           c->err_info,
-                           (dma_addr_t) le64_to_cpu(c->ErrDesc.Addr));
-       pci_free_consistent(h->pdev, sizeof(*c),
-                           c, (dma_addr_t) (c->busaddr & DIRECT_LOOKUP_MASK));
-}
-
 #ifdef CONFIG_COMPAT
 
 static int hpsa_ioctl32_passthru(struct scsi_device *dev, int cmd,
@@ -4866,7 +4702,7 @@ static int hpsa_passthru_ioctl(struct ctlr_info *h, void __user *argp)
                        memset(buff, 0, iocommand.buf_size);
                }
        }
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
        if (c == NULL) {
                rc = -ENOMEM;
                goto out_kfree;
@@ -4883,8 +4719,6 @@ static int hpsa_passthru_ioctl(struct ctlr_info *h, void __user *argp)
                c->Header.SGTotal = cpu_to_le16(0);
        }
        memcpy(&c->Header.LUN, &iocommand.LUN_info, sizeof(c->Header.LUN));
-       /* use the kernel address the cmd block for tag */
-       c->Header.tag = c->busaddr;
 
        /* Fill in Request block */
        memcpy(&c->Request, &iocommand.Request,
@@ -4925,7 +4759,7 @@ static int hpsa_passthru_ioctl(struct ctlr_info *h, void __user *argp)
                }
        }
 out:
-       cmd_special_free(h, c);
+       cmd_free(h, c);
 out_kfree:
        kfree(buff);
        return rc;
@@ -4940,7 +4774,6 @@ static int hpsa_big_passthru_ioctl(struct ctlr_info *h, void __user *argp)
        u64 temp64;
        BYTE sg_used = 0;
        int status = 0;
-       int i;
        u32 left;
        u32 sz;
        BYTE __user *data_ptr;
@@ -5004,7 +4837,7 @@ static int hpsa_big_passthru_ioctl(struct ctlr_info *h, void __user *argp)
                data_ptr += sz;
                sg_used++;
        }
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
        if (c == NULL) {
                status = -ENOMEM;
                goto cleanup1;
@@ -5014,7 +4847,6 @@ static int hpsa_big_passthru_ioctl(struct ctlr_info *h, void __user *argp)
        c->Header.SGList = (u8) sg_used;
        c->Header.SGTotal = cpu_to_le16(sg_used);
        memcpy(&c->Header.LUN, &ioc->LUN_info, sizeof(c->Header.LUN));
-       c->Header.tag = c->busaddr;
        memcpy(&c->Request, &ioc->Request, sizeof(c->Request));
        if (ioc->buf_size > 0) {
                int i;
@@ -5047,6 +4879,8 @@ static int hpsa_big_passthru_ioctl(struct ctlr_info *h, void __user *argp)
                goto cleanup0;
        }
        if ((ioc->Request.Type.Direction & XFER_READ) && ioc->buf_size > 0) {
+               int i;
+
                /* Copy the data out of the buffer we created */
                BYTE __user *ptr = ioc->buf;
                for (i = 0; i < sg_used; i++) {
@@ -5059,9 +4893,11 @@ static int hpsa_big_passthru_ioctl(struct ctlr_info *h, void __user *argp)
        }
        status = 0;
 cleanup0:
-       cmd_special_free(h, c);
+       cmd_free(h, c);
 cleanup1:
        if (buff) {
+               int i;
+
                for (i = 0; i < sg_used; i++)
                        kfree(buff[i]);
                kfree(buff);
@@ -5173,7 +5009,6 @@ static int fill_cmd(struct CommandList *c, u8 cmd, struct ctlr_info *h,
 {
        int pci_dir = XFER_NONE;
        struct CommandList *a; /* for commands to be aborted */
-       u32 tupper, tlower;
 
        c->cmd_type = CMD_IOCTL_PEND;
        c->Header.ReplyQueue = 0;
@@ -5184,7 +5019,6 @@ static int fill_cmd(struct CommandList *c, u8 cmd, struct ctlr_info *h,
                c->Header.SGList = 0;
                c->Header.SGTotal = cpu_to_le16(0);
        }
-       c->Header.tag = c->busaddr;
        memcpy(c->Header.LUN.LunAddrBytes, scsi3addr, 8);
 
        if (cmd_type == TYPE_CMD) {
@@ -5281,10 +5115,9 @@ static int fill_cmd(struct CommandList *c, u8 cmd, struct ctlr_info *h,
                        break;
                case  HPSA_ABORT_MSG:
                        a = buff;       /* point to command to be aborted */
-                       dev_dbg(&h->pdev->dev, "Abort Tag:0x%016llx using request Tag:0x%016llx",
+                       dev_dbg(&h->pdev->dev,
+                               "Abort Tag:0x%016llx request Tag:0x%016llx",
                                a->Header.tag, c->Header.tag);
-                       tlower = (u32) (a->Header.tag >> 32);
-                       tupper = (u32) (a->Header.tag & 0x0ffffffffULL);
                        c->Request.CDBLen = 16;
                        c->Request.type_attr_dir =
                                        TYPE_ATTR_DIR(cmd_type,
@@ -5295,14 +5128,8 @@ static int fill_cmd(struct CommandList *c, u8 cmd, struct ctlr_info *h,
                        c->Request.CDB[2] = 0x00; /* reserved */
                        c->Request.CDB[3] = 0x00; /* reserved */
                        /* Tag to abort goes in CDB[4]-CDB[11] */
-                       c->Request.CDB[4] = tlower & 0xFF;
-                       c->Request.CDB[5] = (tlower >> 8) & 0xFF;
-                       c->Request.CDB[6] = (tlower >> 16) & 0xFF;
-                       c->Request.CDB[7] = (tlower >> 24) & 0xFF;
-                       c->Request.CDB[8] = tupper & 0xFF;
-                       c->Request.CDB[9] = (tupper >> 8) & 0xFF;
-                       c->Request.CDB[10] = (tupper >> 16) & 0xFF;
-                       c->Request.CDB[11] = (tupper >> 24) & 0xFF;
+                       memcpy(&c->Request.CDB[4], &a->Header.tag,
+                               sizeof(a->Header.tag));
                        c->Request.CDB[12] = 0x00; /* reserved */
                        c->Request.CDB[13] = 0x00; /* reserved */
                        c->Request.CDB[14] = 0x00; /* reserved */
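
The memcpy above copies the 8-byte tag straight into CDB[4]-CDB[11]; because the header tag is kept in little-endian form, CDB[4] ends up holding the lowest-order byte. A small stand-alone sketch of that byte layout (plain C, local names only; in kernel code, put_unaligned_le64() writes the same layout from a CPU-order value):

    #include <stdint.h>
    #include <stdio.h>

    /* Local names only; 'cdb' and 'tag' stand in for the driver's fields. */
    static void pack_tag_le(uint8_t *cdb, uint64_t tag)
    {
            int i;

            for (i = 0; i < 8; i++)                 /* CDB[4] gets the lowest byte */
                    cdb[4 + i] = (uint8_t)(tag >> (8 * i));
    }

    int main(void)
    {
            uint8_t cdb[16] = { 0 };
            int i;

            pack_tag_le(cdb, 0x1122334455667788ULL);
            for (i = 4; i < 12; i++)                /* prints 88 77 66 55 44 33 22 11 */
                    printf("%02x ", cdb[i]);
            printf("\n");
            return 0;
    }
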
@@ -5349,47 +5176,6 @@ static void __iomem *remap_pci_mem(ulong base, ulong size)
        return page_remapped ? (page_remapped + page_offs) : NULL;
 }
 
-/* Takes cmds off the submission queue and sends them to the hardware,
- * then puts them on the queue of cmds waiting for completion.
- * Assumes h->lock is held
- */
-static void start_io(struct ctlr_info *h, unsigned long *flags)
-{
-       struct CommandList *c;
-
-       while (!list_empty(&h->reqQ)) {
-               c = list_entry(h->reqQ.next, struct CommandList, list);
-               /* can't do anything if fifo is full */
-               if ((h->access.fifo_full(h))) {
-                       h->fifo_recently_full = 1;
-                       dev_warn(&h->pdev->dev, "fifo full\n");
-                       break;
-               }
-               h->fifo_recently_full = 0;
-
-               /* Get the first entry from the Request Q */
-               removeQ(c);
-               h->Qdepth--;
-
-               /* Put job onto the completed Q */
-               addQ(&h->cmpQ, c);
-               atomic_inc(&h->commands_outstanding);
-               spin_unlock_irqrestore(&h->lock, *flags);
-               /* Tell the controller execute command */
-               h->access.submit_command(h, c);
-               spin_lock_irqsave(&h->lock, *flags);
-       }
-}
-
-static void lock_and_start_io(struct ctlr_info *h)
-{
-       unsigned long flags;
-
-       spin_lock_irqsave(&h->lock, flags);
-       start_io(h, &flags);
-       spin_unlock_irqrestore(&h->lock, flags);
-}
-
 static inline unsigned long get_next_completion(struct ctlr_info *h, u8 q)
 {
        return h->access.command_completed(h, q);
@@ -5418,53 +5204,12 @@ static inline int bad_tag(struct ctlr_info *h, u32 tag_index,
 
 static inline void finish_cmd(struct CommandList *c)
 {
-       unsigned long flags;
-       int io_may_be_stalled = 0;
-       struct ctlr_info *h = c->h;
-       int count;
-
-       spin_lock_irqsave(&h->lock, flags);
-       removeQ(c);
-
-       /*
-        * Check for possibly stalled i/o.
-        *
-        * If a fifo_full condition is encountered, requests will back up
-        * in h->reqQ.  This queue is only emptied out by start_io which is
-        * only called when a new i/o request comes in.  If no i/o's are
-        * forthcoming, the i/o's in h->reqQ can get stuck.  So we call
-        * start_io from here if we detect such a danger.
-        *
-        * Normally, we shouldn't hit this case, but pounding on the
-        * CCISS_PASSTHRU ioctl can provoke it.  Only call start_io if
-        * commands_outstanding is low.  We want to avoid calling
-        * start_io from in here as much as possible, and esp. don't
-        * want to get in a cycle where we call start_io every time
-        * through here.
-        */
-       count = atomic_read(&h->commands_outstanding);
-       spin_unlock_irqrestore(&h->lock, flags);
-       if (unlikely(h->fifo_recently_full) && count < 5)
-               io_may_be_stalled = 1;
-
        dial_up_lockup_detection_on_fw_flash_complete(c->h, c);
        if (likely(c->cmd_type == CMD_IOACCEL1 || c->cmd_type == CMD_SCSI
                        || c->cmd_type == CMD_IOACCEL2))
                complete_scsi_command(c);
        else if (c->cmd_type == CMD_IOCTL_PEND)
                complete(c->waiting);
-       if (unlikely(io_may_be_stalled))
-               lock_and_start_io(h);
-}
-
-static inline u32 hpsa_tag_contains_index(u32 tag)
-{
-       return tag & DIRECT_LOOKUP_BIT;
-}
-
-static inline u32 hpsa_tag_to_index(u32 tag)
-{
-       return tag >> DIRECT_LOOKUP_SHIFT;
 }
 
 
@@ -5484,34 +5229,13 @@ static inline void process_indexed_cmd(struct ctlr_info *h,
        u32 tag_index;
        struct CommandList *c;
 
-       tag_index = hpsa_tag_to_index(raw_tag);
+       tag_index = raw_tag >> DIRECT_LOOKUP_SHIFT;
        if (!bad_tag(h, tag_index, raw_tag)) {
                c = h->cmd_pool + tag_index;
                finish_cmd(c);
        }
 }
 
-/* process completion of a non-indexed command */
-static inline void process_nonindexed_cmd(struct ctlr_info *h,
-       u32 raw_tag)
-{
-       u32 tag;
-       struct CommandList *c = NULL;
-       unsigned long flags;
-
-       tag = hpsa_tag_discard_error_bits(h, raw_tag);
-       spin_lock_irqsave(&h->lock, flags);
-       list_for_each_entry(c, &h->cmpQ, list) {
-               if ((c->busaddr & 0xFFFFFFE0) == (tag & 0xFFFFFFE0)) {
-                       spin_unlock_irqrestore(&h->lock, flags);
-                       finish_cmd(c);
-                       return;
-               }
-       }
-       spin_unlock_irqrestore(&h->lock, flags);
-       bad_tag(h, h->nr_cmds + 1, raw_tag);
-}
-
 /* Some controllers, like p400, will give us one interrupt
  * after a soft reset, even if we turned interrupts off.
  * Only need to check for this in the hpsa_xxx_discard_completions
@@ -5589,10 +5313,7 @@ static irqreturn_t do_hpsa_intr_intx(int irq, void *queue)
        while (interrupt_pending(h)) {
                raw_tag = get_next_completion(h, q);
                while (raw_tag != FIFO_EMPTY) {
-                       if (likely(hpsa_tag_contains_index(raw_tag)))
-                               process_indexed_cmd(h, raw_tag);
-                       else
-                               process_nonindexed_cmd(h, raw_tag);
+                       process_indexed_cmd(h, raw_tag);
                        raw_tag = next_command(h, q);
                }
        }
@@ -5608,10 +5329,7 @@ static irqreturn_t do_hpsa_intr_msi(int irq, void *queue)
        h->last_intr_timestamp = get_jiffies_64();
        raw_tag = get_next_completion(h, q);
        while (raw_tag != FIFO_EMPTY) {
-               if (likely(hpsa_tag_contains_index(raw_tag)))
-                       process_indexed_cmd(h, raw_tag);
-               else
-                       process_nonindexed_cmd(h, raw_tag);
+               process_indexed_cmd(h, raw_tag);
                raw_tag = next_command(h, q);
        }
        return IRQ_HANDLED;
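
With the non-indexed path gone, both interrupt handlers treat every completion as a direct-lookup tag: process_indexed_cmd() recovers the command's slot in h->cmd_pool by shifting the raw tag right by DIRECT_LOOKUP_SHIFT, mirroring how the tags are generated (index << DIRECT_LOOKUP_SHIFT), with the low bits left clear for the controller's status bits (compare the HPSA_SIMPLE_ERROR_BITS masking later in this file). A minimal, self-contained sketch of that round trip; the shift value below is an assumption for illustration only:

    #include <assert.h>
    #include <stdint.h>

    #define EXAMPLE_LOOKUP_SHIFT 5          /* assumed value for this sketch only */

    static uint32_t encode_tag(uint32_t index)
    {
            return index << EXAMPLE_LOOKUP_SHIFT;   /* tag handed to the controller */
    }

    static uint32_t decode_tag(uint32_t raw_tag)
    {
            return raw_tag >> EXAMPLE_LOOKUP_SHIFT; /* pool index on completion */
    }

    int main(void)
    {
            uint32_t i;

            for (i = 0; i < 1024; i++)
                    assert(decode_tag(encode_tag(i)) == i);
            return 0;
    }
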
@@ -5633,7 +5351,8 @@ static int hpsa_message(struct pci_dev *pdev, unsigned char opcode,
        static const size_t cmd_sz = sizeof(*cmd) +
                                        sizeof(cmd->ErrorDescriptor);
        dma_addr_t paddr64;
-       uint32_t paddr32, tag;
+       __le32 paddr32;
+       u32 tag;
        void __iomem *vaddr;
        int i, err;
 
@@ -5648,7 +5367,7 @@ static int hpsa_message(struct pci_dev *pdev, unsigned char opcode,
        err = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(32));
        if (err) {
                iounmap(vaddr);
-               return -ENOMEM;
+               return err;
        }
 
        cmd = pci_alloc_consistent(pdev, cmd_sz, &paddr64);
@@ -5661,12 +5380,12 @@ static int hpsa_message(struct pci_dev *pdev, unsigned char opcode,
         * although there's no guarantee, we assume that the address is at
         * least 4-byte aligned (most likely, it's page-aligned).
         */
-       paddr32 = paddr64;
+       paddr32 = cpu_to_le32(paddr64);
 
        cmd->CommandHeader.ReplyQueue = 0;
        cmd->CommandHeader.SGList = 0;
        cmd->CommandHeader.SGTotal = cpu_to_le16(0);
-       cmd->CommandHeader.tag = paddr32;
+       cmd->CommandHeader.tag = cpu_to_le64(paddr64);
        memset(&cmd->CommandHeader.LUN.LunAddrBytes, 0, 8);
 
        cmd->Request.CDBLen = 16;
@@ -5677,14 +5396,14 @@ static int hpsa_message(struct pci_dev *pdev, unsigned char opcode,
        cmd->Request.CDB[1] = type;
        memset(&cmd->Request.CDB[2], 0, 14); /* rest of the CDB is reserved */
        cmd->ErrorDescriptor.Addr =
-                       cpu_to_le64((paddr32 + sizeof(*cmd)));
+                       cpu_to_le64((le32_to_cpu(paddr32) + sizeof(*cmd)));
        cmd->ErrorDescriptor.Len = cpu_to_le32(sizeof(struct ErrorInfo));
 
-       writel(paddr32, vaddr + SA5_REQUEST_PORT_OFFSET);
+       writel(le32_to_cpu(paddr32), vaddr + SA5_REQUEST_PORT_OFFSET);
 
        for (i = 0; i < HPSA_MSG_SEND_RETRY_LIMIT; i++) {
                tag = readl(vaddr + SA5_REPLY_PORT_OFFSET);
-               if ((tag & ~HPSA_SIMPLE_ERROR_BITS) == paddr32)
+               if ((tag & ~HPSA_SIMPLE_ERROR_BITS) == paddr64)
                        break;
                msleep(HPSA_MSG_SEND_RETRY_INTERVAL_MSECS);
        }
@@ -5718,8 +5437,6 @@ static int hpsa_message(struct pci_dev *pdev, unsigned char opcode,
 static int hpsa_controller_hard_reset(struct pci_dev *pdev,
        void __iomem *vaddr, u32 use_doorbell)
 {
-       u16 pmcsr;
-       int pos;
 
        if (use_doorbell) {
                /* For everything after the P600, the PCI power state method
@@ -5745,26 +5462,21 @@ static int hpsa_controller_hard_reset(struct pci_dev *pdev,
                 * this causes a secondary PCI reset which will reset the
                 * controller." */
 
-               pos = pci_find_capability(pdev, PCI_CAP_ID_PM);
-               if (pos == 0) {
-                       dev_err(&pdev->dev,
-                               "hpsa_reset_controller: "
-                               "PCI PM not supported\n");
-                       return -ENODEV;
-               }
+               int rc = 0;
+
                dev_info(&pdev->dev, "using PCI PM to reset controller\n");
+
                /* enter the D3hot power management state */
-               pci_read_config_word(pdev, pos + PCI_PM_CTRL, &pmcsr);
-               pmcsr &= ~PCI_PM_CTRL_STATE_MASK;
-               pmcsr |= PCI_D3hot;
-               pci_write_config_word(pdev, pos + PCI_PM_CTRL, pmcsr);
+               rc = pci_set_power_state(pdev, PCI_D3hot);
+               if (rc)
+                       return rc;
 
                msleep(500);
 
                /* enter the D0 power management state */
-               pmcsr &= ~PCI_PM_CTRL_STATE_MASK;
-               pmcsr |= PCI_D0;
-               pci_write_config_word(pdev, pos + PCI_PM_CTRL, pmcsr);
+               rc = pci_set_power_state(pdev, PCI_D0);
+               if (rc)
+                       return rc;
 
                /*
                 * The P600 requires a small delay when changing states.
@@ -5858,8 +5570,12 @@ static int hpsa_kdump_hard_reset_controller(struct pci_dev *pdev)
         */
 
        rc = hpsa_lookup_board_id(pdev, &board_id);
-       if (rc < 0 || !ctlr_is_resettable(board_id)) {
-               dev_warn(&pdev->dev, "Not resetting device.\n");
+       if (rc < 0) {
+               dev_warn(&pdev->dev, "Board ID not found\n");
+               return rc;
+       }
+       if (!ctlr_is_resettable(board_id)) {
+               dev_warn(&pdev->dev, "Controller not resettable\n");
                return -ENODEV;
        }
 
@@ -5892,7 +5608,7 @@ static int hpsa_kdump_hard_reset_controller(struct pci_dev *pdev)
        }
        rc = write_driver_ver_to_cfgtable(cfgtable);
        if (rc)
-               goto unmap_vaddr;
+               goto unmap_cfgtable;
 
        /* If reset via doorbell register is supported, use that.
         * There are two such methods.  Favor the newest method.
@@ -5904,8 +5620,8 @@ static int hpsa_kdump_hard_reset_controller(struct pci_dev *pdev)
        } else {
                use_doorbell = misc_fw_support & MISC_FW_DOORBELL_RESET;
                if (use_doorbell) {
-                       dev_warn(&pdev->dev, "Soft reset not supported. "
-                               "Firmware update is required.\n");
+                       dev_warn(&pdev->dev,
+                               "Soft reset not supported. Firmware update is required.\n");
                        rc = -ENOTSUPP; /* try soft reset */
                        goto unmap_cfgtable;
                }
@@ -5925,8 +5641,7 @@ static int hpsa_kdump_hard_reset_controller(struct pci_dev *pdev)
        rc = hpsa_wait_for_board_state(pdev, vaddr, BOARD_READY);
        if (rc) {
                dev_warn(&pdev->dev,
-                       "failed waiting for board to become ready "
-                       "after hard reset\n");
+                       "Failed waiting for board to become ready after hard reset\n");
                goto unmap_cfgtable;
        }
 
@@ -5977,7 +5692,7 @@ static void print_cfg_table(struct device *dev, struct CfgTable __iomem *tb)
               readl(&(tb->HostWrite.CoalIntDelay)));
        dev_info(dev, "   Coalesce Interrupt Count = 0x%x\n",
               readl(&(tb->HostWrite.CoalIntCount)));
-       dev_info(dev, "   Max outstanding commands = 0x%d\n",
+       dev_info(dev, "   Max outstanding commands = %d\n",
               readl(&(tb->CmdsOutMax)));
        dev_info(dev, "   Bus Types = 0x%x\n", readl(&(tb->BusTypes)));
        for (i = 0; i < 16; i++)
@@ -6025,7 +5740,7 @@ static int find_PCI_BAR_index(struct pci_dev *pdev, unsigned long pci_bar_addr)
 }
 
 /* If MSI/MSI-X is supported by the kernel we will try to enable it on
- * controllers that are capable. If not, we use IO-APIC mode.
+ * controllers that are capable. If not, we use legacy INTx mode.
  */
 
 static void hpsa_interrupt_mode(struct ctlr_info *h)
@@ -6044,7 +5759,7 @@ static void hpsa_interrupt_mode(struct ctlr_info *h)
            (h->board_id == 0x40820E11) || (h->board_id == 0x40830E11))
                goto default_int_mode;
        if (pci_find_capability(h->pdev, PCI_CAP_ID_MSIX)) {
-               dev_info(&h->pdev->dev, "MSIX\n");
+               dev_info(&h->pdev->dev, "MSI-X capable controller\n");
                h->msix_vector = MAX_REPLY_QUEUES;
                if (h->msix_vector > num_online_cpus())
                        h->msix_vector = num_online_cpus();
@@ -6065,7 +5780,7 @@ static void hpsa_interrupt_mode(struct ctlr_info *h)
        }
 single_msi_mode:
        if (pci_find_capability(h->pdev, PCI_CAP_ID_MSI)) {
-               dev_info(&h->pdev->dev, "MSI\n");
+               dev_info(&h->pdev->dev, "MSI capable controller\n");
                if (!pci_enable_msi(h->pdev))
                        h->msi_vector = 1;
                else
@@ -6172,8 +5887,10 @@ static int hpsa_find_cfgtables(struct ctlr_info *h)
                return rc;
        h->cfgtable = remap_pci_mem(pci_resource_start(h->pdev,
                       cfg_base_addr_index) + cfg_offset, sizeof(*h->cfgtable));
-       if (!h->cfgtable)
+       if (!h->cfgtable) {
+               dev_err(&h->pdev->dev, "Failed mapping cfgtable\n");
                return -ENOMEM;
+       }
        rc = write_driver_ver_to_cfgtable(h->cfgtable);
        if (rc)
                return rc;
@@ -6204,6 +5921,15 @@ static void hpsa_get_max_perf_mode_cmds(struct ctlr_info *h)
        }
 }
 
+/* If the controller reports that the total max sg entries is greater than 512,
+ * then we know that chained SG blocks work.  (Original smart arrays did not
+ * support chained SG blocks and would return zero for max sg entries.)
+ */
+static int hpsa_supports_chained_sg_blocks(struct ctlr_info *h)
+{
+       return h->maxsgentries > 512;
+}
+
 /* Interrogate the hardware for some limits:
  * max commands, max SG elements without chaining, and with chaining,
  * SG chain block size, etc.
@@ -6211,21 +5937,23 @@ static void hpsa_get_max_perf_mode_cmds(struct ctlr_info *h)
 static void hpsa_find_board_params(struct ctlr_info *h)
 {
        hpsa_get_max_perf_mode_cmds(h);
-       h->nr_cmds = h->max_commands - 4; /* Allow room for some ioctls */
+       h->nr_cmds = h->max_commands;
        h->maxsgentries = readl(&(h->cfgtable->MaxScatterGatherElements));
        h->fw_support = readl(&(h->cfgtable->misc_fw_support));
-       /*
-        * Limit in-command s/g elements to 32 save dma'able memory.
-        * Howvever spec says if 0, use 31
-        */
-       h->max_cmd_sg_entries = 31;
-       if (h->maxsgentries > 512) {
+       if (hpsa_supports_chained_sg_blocks(h)) {
+               /* Limit in-command s/g elements to 32 to save dma'able memory. */
                h->max_cmd_sg_entries = 32;
                h->chainsize = h->maxsgentries - h->max_cmd_sg_entries;
                h->maxsgentries--; /* save one for chain pointer */
        } else {
-               h->chainsize = 0;
+               /*
+                * Original smart arrays supported at most 31 s/g entries
+                * embedded inline in the command (trying to use more
+                * would lock up the controller)
+                */
+               h->max_cmd_sg_entries = 31;
                h->maxsgentries = 31; /* default to traditional values */
+               h->chainsize = 0;
        }
 
        /* Find out what task management functions are supported and cache */
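
In hpsa_find_board_params() above, a controller that supports chained SG blocks gets its inline SG entries capped at 32, the chain block receives the remainder of what the controller reported, and one reported entry is reserved for the chain pointer. A worked example in plain C, using an assumed report of 1024 entries (an illustrative figure, not a real controller value):

    #include <stdio.h>

    int main(void)
    {
            unsigned int maxsgentries = 1024;       /* assumed value from the config table */
            unsigned int max_cmd_sg_entries, chainsize;

            if (maxsgentries > 512) {               /* chained SG blocks supported */
                    max_cmd_sg_entries = 32;
                    chainsize = maxsgentries - max_cmd_sg_entries;  /* 992 */
                    maxsgentries--;                 /* 1023: one entry kept for the chain pointer */
            } else {                                /* original smart arrays: inline only */
                    max_cmd_sg_entries = 31;
                    maxsgentries = 31;
                    chainsize = 0;
            }
            printf("inline=%u total=%u chain=%u\n",
                   max_cmd_sg_entries, maxsgentries, chainsize);
            return 0;
    }
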
@@ -6239,7 +5967,7 @@ static void hpsa_find_board_params(struct ctlr_info *h)
 static inline bool hpsa_CISS_signature_present(struct ctlr_info *h)
 {
        if (!check_signature(h->cfgtable->Signature, "CISS", 4)) {
-               dev_warn(&h->pdev->dev, "not a valid CISS config table\n");
+               dev_err(&h->pdev->dev, "not a valid CISS config table\n");
                return false;
        }
        return true;
@@ -6331,7 +6059,7 @@ static int hpsa_enter_simple_mode(struct ctlr_info *h)
        h->transMethod = CFGTBL_Trans_Simple;
        return 0;
 error:
-       dev_warn(&h->pdev->dev, "unable to get board into simple mode\n");
+       dev_err(&h->pdev->dev, "failed to enter simple mode\n");
        return -ENODEV;
 }
 
@@ -6341,7 +6069,7 @@ static int hpsa_pci_init(struct ctlr_info *h)
 
        prod_index = hpsa_lookup_board_id(h->pdev, &h->board_id);
        if (prod_index < 0)
-               return -ENODEV;
+               return prod_index;
        h->product_name = products[prod_index].product_name;
        h->access = *(products[prod_index].access);
 
@@ -6422,6 +6150,7 @@ static void hpsa_hba_inquiry(struct ctlr_info *h)
 static int hpsa_init_reset_devices(struct pci_dev *pdev)
 {
        int rc, i;
+       void __iomem *vaddr;
 
        if (!reset_devices)
                return 0;
@@ -6445,6 +6174,14 @@ static int hpsa_init_reset_devices(struct pci_dev *pdev)
 
        pci_set_master(pdev);
 
+       vaddr = pci_ioremap_bar(pdev, 0);
+       if (vaddr == NULL) {
+               rc = -ENOMEM;
+               goto out_disable;
+       }
+       writel(SA5_INTR_OFF, vaddr + SA5_REPLY_INTR_MASK_OFFSET);
+       iounmap(vaddr);
+
        /* Reset the controller with a PCI power-cycle or via doorbell */
        rc = hpsa_kdump_hard_reset_controller(pdev);
 
@@ -6453,14 +6190,11 @@ static int hpsa_init_reset_devices(struct pci_dev *pdev)
         * "performant mode".  Or, it might be 640x, which can't reset
         * due to concerns about shared bbwc between 6402/6404 pair.
         */
-       if (rc) {
-               if (rc != -ENOTSUPP) /* just try to do the kdump anyhow. */
-                       rc = -ENODEV;
+       if (rc)
                goto out_disable;
-       }
 
        /* Now try to get the controller to respond to a no-op */
-       dev_warn(&pdev->dev, "Waiting for controller to respond to no-op\n");
+       dev_info(&pdev->dev, "Waiting for controller to respond to no-op\n");
        for (i = 0; i < HPSA_POST_RESET_NOOP_RETRIES; i++) {
                if (hpsa_noop(pdev) == 0)
                        break;
@@ -6490,9 +6224,12 @@ static int hpsa_allocate_cmd_pool(struct ctlr_info *h)
            || (h->cmd_pool == NULL)
            || (h->errinfo_pool == NULL)) {
                dev_err(&h->pdev->dev, "out of memory in %s", __func__);
-               return -ENOMEM;
+               goto clean_up;
        }
        return 0;
+clean_up:
+       hpsa_free_cmd_pool(h);
+       return -ENOMEM;
 }
 
 static void hpsa_free_cmd_pool(struct ctlr_info *h)
@@ -6519,16 +6256,38 @@ static void hpsa_free_cmd_pool(struct ctlr_info *h)
 
 static void hpsa_irq_affinity_hints(struct ctlr_info *h)
 {
-       int i, cpu, rc;
+       int i, cpu;
 
        cpu = cpumask_first(cpu_online_mask);
        for (i = 0; i < h->msix_vector; i++) {
-               rc = irq_set_affinity_hint(h->intr[i], get_cpu_mask(cpu));
+               irq_set_affinity_hint(h->intr[i], get_cpu_mask(cpu));
                cpu = cpumask_next(cpu, cpu_online_mask);
        }
 }
 
-static int hpsa_request_irq(struct ctlr_info *h,
+/* clear affinity hints and free MSI-X, MSI, or legacy INTx vectors */
+static void hpsa_free_irqs(struct ctlr_info *h)
+{
+       int i;
+
+       if (!h->msix_vector || h->intr_mode != PERF_MODE_INT) {
+               /* Single reply queue, only one irq to free */
+               i = h->intr_mode;
+               irq_set_affinity_hint(h->intr[i], NULL);
+               free_irq(h->intr[i], &h->q[i]);
+               return;
+       }
+
+       for (i = 0; i < h->msix_vector; i++) {
+               irq_set_affinity_hint(h->intr[i], NULL);
+               free_irq(h->intr[i], &h->q[i]);
+       }
+       for (; i < MAX_REPLY_QUEUES; i++)
+               h->q[i] = 0;
+}
+
+/* returns 0 on success; cleans up and returns -Enn on error */
+static int hpsa_request_irqs(struct ctlr_info *h,
        irqreturn_t (*msixhandler)(int, void *),
        irqreturn_t (*intxhandler)(int, void *))
 {
@@ -6543,10 +6302,25 @@ static int hpsa_request_irq(struct ctlr_info *h,
 
        if (h->intr_mode == PERF_MODE_INT && h->msix_vector > 0) {
                /* If performant mode and MSI-X, use multiple reply queues */
-               for (i = 0; i < h->msix_vector; i++)
+               for (i = 0; i < h->msix_vector; i++) {
                        rc = request_irq(h->intr[i], msixhandler,
                                        0, h->devname,
                                        &h->q[i]);
+                       if (rc) {
+                               int j;
+
+                               dev_err(&h->pdev->dev,
+                                       "failed to get irq %d for %s\n",
+                                       h->intr[i], h->devname);
+                               for (j = 0; j < i; j++) {
+                                       free_irq(h->intr[j], &h->q[j]);
+                                       h->q[j] = 0;
+                               }
+                               for (; j < MAX_REPLY_QUEUES; j++)
+                                       h->q[j] = 0;
+                               return rc;
+                       }
+               }
                hpsa_irq_affinity_hints(h);
        } else {
                /* Use single reply pool */
@@ -6592,27 +6366,9 @@ static int hpsa_kdump_soft_reset(struct ctlr_info *h)
        return 0;
 }
 
-static void free_irqs(struct ctlr_info *h)
-{
-       int i;
-
-       if (!h->msix_vector || h->intr_mode != PERF_MODE_INT) {
-               /* Single reply queue, only one irq to free */
-               i = h->intr_mode;
-               irq_set_affinity_hint(h->intr[i], NULL);
-               free_irq(h->intr[i], &h->q[i]);
-               return;
-       }
-
-       for (i = 0; i < h->msix_vector; i++) {
-               irq_set_affinity_hint(h->intr[i], NULL);
-               free_irq(h->intr[i], &h->q[i]);
-       }
-}
-
 static void hpsa_free_irqs_and_disable_msix(struct ctlr_info *h)
 {
-       free_irqs(h);
+       hpsa_free_irqs(h);
 #ifdef CONFIG_PCI_MSI
        if (h->msix_vector) {
                if (h->pdev->msix_enabled)
@@ -6658,14 +6414,17 @@ static void hpsa_undo_allocations_after_kdump_soft_reset(struct ctlr_info *h)
 }
 
 /* Called when controller lockup detected. */
-static void fail_all_cmds_on_list(struct ctlr_info *h, struct list_head *list)
+static void fail_all_outstanding_cmds(struct ctlr_info *h)
 {
+       int i;
        struct CommandList *c = NULL;
 
-       assert_spin_locked(&h->lock);
-       /* Mark all outstanding commands as failed and complete them. */
-       while (!list_empty(list)) {
-               c = list_entry(list->next, struct CommandList, list);
+       flush_workqueue(h->resubmit_wq); /* ensure all cmds are fully built */
+       for (i = 0; i < h->nr_cmds; i++) {
+               if (!test_bit(i & (BITS_PER_LONG - 1),
+                               h->cmd_pool_bits + (i / BITS_PER_LONG)))
+                       continue;
+               c = h->cmd_pool + i;
                c->err_info->CommandStatus = CMD_HARDWARE_ERR;
                finish_cmd(c);
        }
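
fail_all_outstanding_cmds() (and, further down, the reworked hpsa_drain_accel_commands()) now finds in-flight commands by scanning the cmd_pool_bits allocation bitmap rather than walking the old reqQ/cmpQ lists; each index is split into a word offset and a bit offset within that word. A small stand-alone sketch of that bitmap walk, with stand-in names for h->cmd_pool_bits and h->nr_cmds:

    #include <limits.h>
    #include <stdio.h>

    #define BITS_PER_LONG (sizeof(unsigned long) * CHAR_BIT)

    /* Same split as test_bit(i & (BITS_PER_LONG - 1), bits + i / BITS_PER_LONG). */
    static int bit_is_set(const unsigned long *bits, unsigned int i)
    {
            return (bits[i / BITS_PER_LONG] >> (i & (BITS_PER_LONG - 1))) & 1UL;
    }

    int main(void)
    {
            /* Stand-in pool bitmap: slots 0, 2 and BITS_PER_LONG are in use. */
            unsigned long pool_bits[2] = { 0x5UL, 0x1UL };
            unsigned int i;

            for (i = 0; i < 2 * BITS_PER_LONG; i++)
                    if (bit_is_set(pool_bits, i))
                            printf("command %u is outstanding\n", i);
            return 0;
    }
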
@@ -6705,8 +6464,7 @@ static void controller_lockup_detected(struct ctlr_info *h)
                        lockup_detected);
        pci_disable_device(h->pdev);
        spin_lock_irqsave(&h->lock, flags);
-       fail_all_cmds_on_list(h, &h->cmpQ);
-       fail_all_cmds_on_list(h, &h->reqQ);
+       fail_all_outstanding_cmds(h);
        spin_unlock_irqrestore(&h->lock, flags);
 }
 
@@ -6750,9 +6508,6 @@ static void hpsa_ack_ctlr_events(struct ctlr_info *h)
        int i;
        char *event_type;
 
-       /* Clear the driver-requested rescan flag */
-       h->drv_req_rescan = 0;
-
        /* Ask the controller to clear the events we're handling. */
        if ((h->transMethod & (CFGTBL_Trans_io_accel1
                        | CFGTBL_Trans_io_accel2)) &&
@@ -6798,9 +6553,6 @@ static void hpsa_ack_ctlr_events(struct ctlr_info *h)
  */
 static int hpsa_ctlr_needs_rescan(struct ctlr_info *h)
 {
-       if (h->drv_req_rescan)
-               return 1;
-
        if (!(h->fw_support & MISC_FW_EVENT_NOTIFY))
                return 0;
 
@@ -6846,7 +6598,6 @@ static void hpsa_monitor_ctlr_worker(struct work_struct *work)
 
        if (hpsa_ctlr_needs_rescan(h) || hpsa_offline_devices_ready(h)) {
                scsi_host_get(h->scsi_host);
-               h->drv_req_rescan = 0;
                hpsa_ack_ctlr_events(h);
                hpsa_scan_start(h->scsi_host);
                scsi_host_put(h->scsi_host);
@@ -6898,14 +6649,18 @@ reinit_after_soft_reset:
 
        h->pdev = pdev;
        h->intr_mode = hpsa_simple_mode ? SIMPLE_MODE_INT : PERF_MODE_INT;
-       INIT_LIST_HEAD(&h->cmpQ);
-       INIT_LIST_HEAD(&h->reqQ);
        INIT_LIST_HEAD(&h->offline_device_list);
        spin_lock_init(&h->lock);
        spin_lock_init(&h->offline_device_lock);
        spin_lock_init(&h->scan_lock);
        spin_lock_init(&h->passthru_count_lock);
 
+       h->resubmit_wq = alloc_workqueue("hpsa", WQ_MEM_RECLAIM, 0);
+       if (!h->resubmit_wq) {
+               dev_err(&h->pdev->dev, "Failed to allocate work queue\n");
+               rc = -ENOMEM;
+               goto clean1;
+       }
        /* Allocate and clear per-cpu variable lockup_detected */
        h->lockup_detected = alloc_percpu(u32);
        if (!h->lockup_detected) {
@@ -6939,13 +6694,14 @@ reinit_after_soft_reset:
        /* make sure the board interrupts are off */
        h->access.set_intr_mask(h, HPSA_INTR_OFF);
 
-       if (hpsa_request_irq(h, do_hpsa_intr_msi, do_hpsa_intr_intx))
+       if (hpsa_request_irqs(h, do_hpsa_intr_msi, do_hpsa_intr_intx))
                goto clean2;
        dev_info(&pdev->dev, "%s: <0x%x> at IRQ %d%s using DAC\n",
               h->devname, pdev->device,
               h->intr[h->intr_mode], dac ? "" : " not");
-       if (hpsa_allocate_cmd_pool(h))
-               goto clean4;
+       rc = hpsa_allocate_cmd_pool(h);
+       if (rc)
+               goto clean2_and_free_irqs;
        if (hpsa_allocate_sg_chain_blocks(h))
                goto clean4;
        init_waitqueue_head(&h->scan_wait_queue);
@@ -6974,12 +6730,12 @@ reinit_after_soft_reset:
                spin_lock_irqsave(&h->lock, flags);
                h->access.set_intr_mask(h, HPSA_INTR_OFF);
                spin_unlock_irqrestore(&h->lock, flags);
-               free_irqs(h);
-               rc = hpsa_request_irq(h, hpsa_msix_discard_completions,
+               hpsa_free_irqs(h);
+               rc = hpsa_request_irqs(h, hpsa_msix_discard_completions,
                                        hpsa_intx_discard_completions);
                if (rc) {
-                       dev_warn(&h->pdev->dev, "Failed to request_irq after "
-                               "soft reset.\n");
+                       dev_warn(&h->pdev->dev,
+                               "Failed to request_irq after soft reset.\n");
                        goto clean4;
                }
 
@@ -7016,7 +6772,6 @@ reinit_after_soft_reset:
                /* Enable Accelerated IO path at driver layer */
                h->acciopath_status = 1;
 
-       h->drv_req_rescan = 0;
 
        /* Turn the interrupts on so we can service requests */
        h->access.set_intr_mask(h, HPSA_INTR_ON);
@@ -7034,9 +6789,12 @@ reinit_after_soft_reset:
 clean4:
        hpsa_free_sg_chain_blocks(h);
        hpsa_free_cmd_pool(h);
-       free_irqs(h);
+clean2_and_free_irqs:
+       hpsa_free_irqs(h);
 clean2:
 clean1:
+       if (h->resubmit_wq)
+               destroy_workqueue(h->resubmit_wq);
        if (h->lockup_detected)
                free_percpu(h->lockup_detected);
        kfree(h);
@@ -7055,9 +6813,9 @@ static void hpsa_flush_cache(struct ctlr_info *h)
        if (!flush_buf)
                return;
 
-       c = cmd_special_alloc(h);
+       c = cmd_alloc(h);
        if (!c) {
-               dev_warn(&h->pdev->dev, "cmd_special_alloc returned NULL!\n");
+               dev_warn(&h->pdev->dev, "cmd_alloc returned NULL!\n");
                goto out_of_memory;
        }
        if (fill_cmd(c, HPSA_CACHE_FLUSH, h, flush_buf, 4, 0,
@@ -7069,7 +6827,7 @@ static void hpsa_flush_cache(struct ctlr_info *h)
 out:
                dev_warn(&h->pdev->dev,
                        "error flushing cache on controller\n");
-       cmd_special_free(h, c);
+       cmd_free(h, c);
 out_of_memory:
        kfree(flush_buf);
 }
@@ -7112,9 +6870,9 @@ static void hpsa_remove_one(struct pci_dev *pdev)
        h->remove_in_progress = 1;
        cancel_delayed_work(&h->monitor_ctlr_work);
        spin_unlock_irqrestore(&h->lock, flags);
-
        hpsa_unregister_scsi(h);        /* unhook from SCSI subsystem */
        hpsa_shutdown(pdev);
+       destroy_workqueue(h->resubmit_wq);
        iounmap(h->vaddr);
        iounmap(h->transtable);
        iounmap(h->cfgtable);
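
hpsa_remove_one() above now also destroys the resubmit workqueue that probe allocated with WQ_MEM_RECLAIM (so the queue keeps a rescuer thread and can make progress under memory pressure, presumably letting failed accelerated commands be rebuilt and reissued from process context). For reference, a minimal self-contained module sketch of the same workqueue lifecycle (allocate, queue work, flush, destroy); every name here is hypothetical and the worker body is a stand-in, not driver code:

    #include <linux/module.h>
    #include <linux/workqueue.h>
    #include <linux/errno.h>

    static struct workqueue_struct *example_wq;
    static struct work_struct example_work;

    static void example_worker(struct work_struct *work)
    {
            pr_info("deferred work ran in process context\n");
    }

    static int __init example_init(void)
    {
            /* WQ_MEM_RECLAIM guarantees a rescuer thread for forward progress. */
            example_wq = alloc_workqueue("example_wq", WQ_MEM_RECLAIM, 0);
            if (!example_wq)
                    return -ENOMEM;

            INIT_WORK(&example_work, example_worker);
            queue_work(example_wq, &example_work);
            return 0;
    }

    static void __exit example_exit(void)
    {
            flush_workqueue(example_wq);            /* let queued work finish */
            destroy_workqueue(example_wq);
    }

    module_init(example_init);
    module_exit(example_exit);
    MODULE_LICENSE("GPL");
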
@@ -7172,7 +6930,7 @@ static struct pci_driver hpsa_pci_driver = {
  * bits of the command address.
  */
 static void  calc_bucket_map(int bucket[], int num_buckets,
-       int nsgs, int min_blocks, int *bucket_map)
+       int nsgs, int min_blocks, u32 *bucket_map)
 {
        int i, j, b, size;
 
@@ -7288,8 +7046,8 @@ static void hpsa_enter_performant_mode(struct ctlr_info *h, u32 trans_support)
        hpsa_wait_for_mode_change_ack(h);
        register_value = readl(&(h->cfgtable->TransportActive));
        if (!(register_value & CFGTBL_Trans_Performant)) {
-               dev_warn(&h->pdev->dev, "unable to get board into"
-                                       " performant mode\n");
+               dev_err(&h->pdev->dev,
+                       "performant mode problem - transport not active\n");
                return;
        }
        /* Change the access methods to the performant access methods */
@@ -7328,12 +7086,12 @@ static void hpsa_enter_performant_mode(struct ctlr_info *h, u32 trans_support)
                                        (i * sizeof(struct ErrorInfo)));
                        cp->err_info_len = sizeof(struct ErrorInfo);
                        cp->sgl_offset = IOACCEL1_SGLOFFSET;
-                       cp->host_context_flags = IOACCEL1_HCFLAGS_CISS_FORMAT;
+                       cp->host_context_flags =
+                               cpu_to_le16(IOACCEL1_HCFLAGS_CISS_FORMAT);
                        cp->timeout_sec = 0;
                        cp->ReplyQueue = 0;
                        cp->tag =
-                               cpu_to_le64((i << DIRECT_LOOKUP_SHIFT) |
-                                               DIRECT_LOOKUP_BIT);
+                               cpu_to_le64((i << DIRECT_LOOKUP_SHIFT));
                        cp->host_addr =
                                cpu_to_le64(h->ioaccel_cmd_pool_dhandle +
                                        (i * sizeof(struct io_accel1_cmd)));
@@ -7508,19 +7266,19 @@ static int is_accelerated_cmd(struct CommandList *c)
 static void hpsa_drain_accel_commands(struct ctlr_info *h)
 {
        struct CommandList *c = NULL;
-       unsigned long flags;
-       int accel_cmds_out;
+       int i, accel_cmds_out;
 
-       do { /* wait for all outstanding commands to drain out */
+       do { /* wait for all outstanding ioaccel commands to drain out */
                accel_cmds_out = 0;
-               spin_lock_irqsave(&h->lock, flags);
-               list_for_each_entry(c, &h->cmpQ, list)
-                       accel_cmds_out += is_accelerated_cmd(c);
-               list_for_each_entry(c, &h->reqQ, list)
+               for (i = 0; i < h->nr_cmds; i++) {
+                       if (!test_bit(i & (BITS_PER_LONG - 1),
+                                       h->cmd_pool_bits + (i / BITS_PER_LONG)))
+                               continue;
+                       c = h->cmd_pool + i;
                        accel_cmds_out += is_accelerated_cmd(c);
-               spin_unlock_irqrestore(&h->lock, flags);
+               }
                if (accel_cmds_out <= 0)
                        break;
                msleep(100);
        } while (1);
 }