On Tue, Mar 17, 2026 at 12:07:02PM +0000, John Garry wrote:
> Switch to use core scsi ALUA support.
> 
> We still need to drive the state machine for explicit ALUA.
> 
> Signed-off-by: John Garry <[email protected]>
> ---
>  drivers/scsi/device_handler/scsi_dh_alua.c | 580 +--------------------
>  1 file changed, 21 insertions(+), 559 deletions(-)
> 
> diff --git a/drivers/scsi/device_handler/scsi_dh_alua.c 
> b/drivers/scsi/device_handler/scsi_dh_alua.c
> index 067021fffc16f..4d53fab85a7ed 100644
> --- a/drivers/scsi/device_handler/scsi_dh_alua.c
> +++ b/drivers/scsi/device_handler/scsi_dh_alua.c
> @@ -10,6 +10,7 @@
>  #include <linux/module.h>
>  #include <linux/unaligned.h>
>  #include <scsi/scsi.h>
> +#include <scsi/scsi_alua.h>
>  #include <scsi/scsi_proto.h>
>  #include <scsi/scsi_dbg.h>
>  #include <scsi/scsi_eh.h>
> @@ -44,7 +45,6 @@
>  
>  /* device handler flags */
>  #define ALUA_OPTIMIZE_STPG           0x01
> -#define ALUA_RTPG_EXT_HDR_UNSUPP     0x02
>  /* State machine flags */
>  #define ALUA_PG_RUN_RTPG             0x10
>  #define ALUA_PG_RUN_STPG             0x20
> @@ -65,14 +65,6 @@ struct alua_dh_data {
>       unsigned                flags; /* used for optimizing STPG */
>       spinlock_t              lock;
>  
> -     /* alua stuff */
> -     int                     state;
> -     int                     pref;
> -     int                     valid_states;
> -     int                     tpgs;
> -     unsigned char           transition_tmo;
> -     unsigned long           expiry;
> -     unsigned long           interval;
>       struct delayed_work     rtpg_work;
>       struct list_head        rtpg_list;
>  };
> @@ -91,121 +83,6 @@ static bool alua_rtpg_queue(struct scsi_device *sdev,
>                           struct alua_queue_data *qdata, bool force);
>  static void alua_check(struct scsi_device *sdev, bool force);
>  
> -/*
> - * submit_rtpg - Issue a REPORT TARGET GROUP STATES command
> - * @sdev: sdev the command should be sent to
> - */
> -static int submit_rtpg(struct scsi_device *sdev, unsigned char *buff,
> -                    int bufflen, struct scsi_sense_hdr *sshdr, int flags)
> -{
> -     u8 cdb[MAX_COMMAND_SIZE];
> -     blk_opf_t opf = REQ_OP_DRV_IN | REQ_FAILFAST_DEV |
> -                             REQ_FAILFAST_TRANSPORT | REQ_FAILFAST_DRIVER;
> -     const struct scsi_exec_args exec_args = {
> -             .sshdr = sshdr,
> -     };
> -
> -     /* Prepare the command. */
> -     memset(cdb, 0x0, MAX_COMMAND_SIZE);
> -     cdb[0] = MAINTENANCE_IN;
> -     if (!(flags & ALUA_RTPG_EXT_HDR_UNSUPP))
> -             cdb[1] = MI_REPORT_TARGET_PGS | MI_EXT_HDR_PARAM_FMT;
> -     else
> -             cdb[1] = MI_REPORT_TARGET_PGS;
> -     put_unaligned_be32(bufflen, &cdb[6]);
> -
> -     return scsi_execute_cmd(sdev, cdb, opf, buff, bufflen,
> -                             ALUA_FAILOVER_TIMEOUT * HZ,
> -                             ALUA_FAILOVER_RETRIES, &exec_args);
> -}
> -
> -/*
> - * submit_stpg - Issue a SET TARGET PORT GROUP command
> - *
> - * Currently we're only setting the current target port group state
> - * to 'active/optimized' and let the array firmware figure out
> - * the states of the remaining groups.
> - */
> -static int submit_stpg(struct scsi_device *sdev, int group_id,
> -                    struct scsi_sense_hdr *sshdr)
> -{
> -     u8 cdb[MAX_COMMAND_SIZE];
> -     unsigned char stpg_data[8];
> -     int stpg_len = 8;
> -     blk_opf_t opf = REQ_OP_DRV_OUT | REQ_FAILFAST_DEV |
> -                             REQ_FAILFAST_TRANSPORT | REQ_FAILFAST_DRIVER;
> -     const struct scsi_exec_args exec_args = {
> -             .sshdr = sshdr,
> -     };
> -
> -     /* Prepare the data buffer */
> -     memset(stpg_data, 0, stpg_len);
> -     stpg_data[4] = SCSI_ACCESS_STATE_OPTIMAL;
> -     put_unaligned_be16(group_id, &stpg_data[6]);
> -
> -     /* Prepare the command. */
> -     memset(cdb, 0x0, MAX_COMMAND_SIZE);
> -     cdb[0] = MAINTENANCE_OUT;
> -     cdb[1] = MO_SET_TARGET_PGS;
> -     put_unaligned_be32(stpg_len, &cdb[6]);
> -
> -     return scsi_execute_cmd(sdev, cdb, opf, stpg_data,
> -                             stpg_len, ALUA_FAILOVER_TIMEOUT * HZ,
> -                             ALUA_FAILOVER_RETRIES, &exec_args);
> -}
> -
> -/*
> - * alua_check_tpgs - Evaluate TPGS setting
> - * @sdev: device to be checked
> - *
> - * Examine the TPGS setting of the sdev to find out if ALUA
> - * is supported.
> - */
> -static int alua_check_tpgs(struct scsi_device *sdev)
> -{
> -     int tpgs = TPGS_MODE_NONE;
> -
> -     /*
> -      * ALUA support for non-disk devices is fraught with
> -      * difficulties, so disable it for now.
> -      */
> -     if (sdev->type != TYPE_DISK) {
> -             sdev_printk(KERN_INFO, sdev,
> -                         "%s: disable for non-disk devices\n",
> -                         ALUA_DH_NAME);
> -             return tpgs;
> -     }
> -
> -     tpgs = scsi_device_tpgs(sdev);
> -     switch (tpgs) {
> -     case TPGS_MODE_EXPLICIT|TPGS_MODE_IMPLICIT:
> -             sdev_printk(KERN_INFO, sdev,
> -                         "%s: supports implicit and explicit TPGS\n",
> -                         ALUA_DH_NAME);
> -             break;
> -     case TPGS_MODE_EXPLICIT:
> -             sdev_printk(KERN_INFO, sdev, "%s: supports explicit TPGS\n",
> -                         ALUA_DH_NAME);
> -             break;
> -     case TPGS_MODE_IMPLICIT:
> -             sdev_printk(KERN_INFO, sdev, "%s: supports implicit TPGS\n",
> -                         ALUA_DH_NAME);
> -             break;
> -     case TPGS_MODE_NONE:
> -             sdev_printk(KERN_INFO, sdev, "%s: not supported\n",
> -                         ALUA_DH_NAME);
> -             break;
> -     default:
> -             sdev_printk(KERN_INFO, sdev,
> -                         "%s: unsupported TPGS setting %d\n",
> -                         ALUA_DH_NAME, tpgs);
> -             tpgs = TPGS_MODE_NONE;
> -             break;
> -     }
> -
> -     return tpgs;
> -}
> -
>  /*
>   * alua_check_vpd - Evaluate INQUIRY vpd page 0x83
>   * @sdev: device to be checked
> @@ -216,56 +93,11 @@ static int alua_check_tpgs(struct scsi_device *sdev)
>  static int alua_check_vpd(struct scsi_device *sdev, struct alua_dh_data *h,
>                         int tpgs)
>  {
> -     int rel_port = -1;
> -
> -     h->group_id = scsi_vpd_tpg_id(sdev, &rel_port);
> -     if (h->group_id < 0) {
> -             /*
> -              * Internal error; TPGS supported but required
> -              * VPD identification descriptors not present.
> -              * Disable ALUA support
> -              */
> -             sdev_printk(KERN_INFO, sdev,
> -                         "%s: No target port descriptors found\n",
> -                         ALUA_DH_NAME);
> -             return SCSI_DH_DEV_UNSUPP;
> -     }
> -     h->tpgs = tpgs;
> -
>       alua_rtpg_queue(sdev, NULL, true);
>  
>       return SCSI_DH_OK;
>  }
>  
> -static char print_alua_state(unsigned char state)
> -{
> -     switch (state) {
> -     case SCSI_ACCESS_STATE_OPTIMAL:
> -             return 'A';
> -     case SCSI_ACCESS_STATE_ACTIVE:
> -             return 'N';
> -     case SCSI_ACCESS_STATE_STANDBY:
> -             return 'S';
> -     case SCSI_ACCESS_STATE_UNAVAILABLE:
> -             return 'U';
> -     case SCSI_ACCESS_STATE_LBA:
> -             return 'L';
> -     case SCSI_ACCESS_STATE_OFFLINE:
> -             return 'O';
> -     case SCSI_ACCESS_STATE_TRANSITIONING:
> -             return 'T';
> -     default:
> -             return 'X';
> -     }
> -}
> -
> -static void alua_handle_state_transition(struct scsi_device *sdev)
> -{
> -     struct alua_dh_data *h = sdev->handler_data;
> -
> -     h->state = SCSI_ACCESS_STATE_TRANSITIONING;
> -}
> -
>  static enum scsi_disposition alua_check_sense(struct scsi_device *sdev,
>                                             struct scsi_sense_hdr *sense_hdr)
>  {
> @@ -275,7 +107,7 @@ static enum scsi_disposition alua_check_sense(struct 
> scsi_device *sdev,
>                       /*
>                        * LUN Not Accessible - ALUA state transition
>                        */
> -                     alua_handle_state_transition(sdev);
> +                     scsi_alua_handle_state_transition(sdev);
>                       return NEEDS_RETRY;
>               }
>               break;
> @@ -284,7 +116,7 @@ static enum scsi_disposition alua_check_sense(struct 
> scsi_device *sdev,
>                       /*
>                        * LUN Not Accessible - ALUA state transition
>                        */
> -                     alua_handle_state_transition(sdev);
> +                     scsi_alua_handle_state_transition(sdev);
>                       return NEEDS_RETRY;
>               }
>               if (sense_hdr->asc == 0x29 && sense_hdr->ascq == 0x00) {
> @@ -338,329 +170,6 @@ static enum scsi_disposition alua_check_sense(struct 
> scsi_device *sdev,
>       return SCSI_RETURN_NOT_HANDLED;
>  }
>  
> -/*
> - * alua_tur - Send a TEST UNIT READY
> - * @sdev: device to which the TEST UNIT READY command should be send
> - *
> - * Send a TEST UNIT READY to @sdev to figure out the device state
> - * Returns SCSI_DH_RETRY if the sense code is NOT READY/ALUA TRANSITIONING,
> - * SCSI_DH_OK if no error occurred, and SCSI_DH_IO otherwise.
> - */
> -static int alua_tur(struct scsi_device *sdev)
> -{
> -     struct scsi_sense_hdr sense_hdr;
> -     int retval;
> -
> -     retval = scsi_test_unit_ready(sdev, ALUA_FAILOVER_TIMEOUT * HZ,
> -                                   ALUA_FAILOVER_RETRIES, &sense_hdr);
> -     if ((sense_hdr.sense_key == NOT_READY ||
> -          sense_hdr.sense_key == UNIT_ATTENTION) &&
> -         sense_hdr.asc == 0x04 && sense_hdr.ascq == 0x0a)
> -             return SCSI_DH_RETRY;
> -     else if (retval)
> -             return SCSI_DH_IO;
> -     else
> -             return SCSI_DH_OK;
> -}
> -
> -/*
> - * alua_rtpg - Evaluate REPORT TARGET GROUP STATES
> - * @sdev: the device to be evaluated.
> - *
> - * Evaluate the Target Port Group State.
> - * Returns SCSI_DH_DEV_OFFLINED if the path is
> - * found to be unusable.
> - */
> -static int alua_rtpg(struct scsi_device *sdev)
> -{
> -     struct scsi_sense_hdr sense_hdr;
> -     struct alua_dh_data *h = sdev->handler_data;
> -     int len, k, off, bufflen = ALUA_RTPG_SIZE;
> -     int group_id_old, state_old, pref_old, valid_states_old;
> -     unsigned char *desc, *buff;
> -     unsigned err;
> -     int retval;
> -     unsigned int tpg_desc_tbl_off;
> -     unsigned char orig_transition_tmo;
> -     unsigned long flags;
> -     bool transitioning_sense = false;
> -     int rel_port, group_id = scsi_vpd_tpg_id(sdev, &rel_port);
> -
> -     if (group_id < 0) {
> -             /*
> -              * Internal error; TPGS supported but required
> -              * VPD identification descriptors not present.
> -              * Disable ALUA support
> -              */
> -             sdev_printk(KERN_INFO, sdev,
> -                         "%s: No target port descriptors found\n",
> -                         ALUA_DH_NAME);
> -             return SCSI_DH_DEV_UNSUPP;
> -     }
> -
> -     group_id_old = h->group_id;
> -     state_old = h->state;
> -     pref_old = h->pref;
> -     valid_states_old = h->valid_states;
> -
> -     if (!h->expiry) {
> -             unsigned long transition_tmo = ALUA_FAILOVER_TIMEOUT * HZ;
> -
> -             if (h->transition_tmo)
> -                     transition_tmo = h->transition_tmo * HZ;
> -
> -             h->expiry = round_jiffies_up(jiffies + transition_tmo);
> -     }
> -
> -     buff = kzalloc(bufflen, GFP_KERNEL);
> -     if (!buff)
> -             return SCSI_DH_DEV_TEMP_BUSY;
> -
> - retry:
> -     err = 0;
> -     retval = submit_rtpg(sdev, buff, bufflen, &sense_hdr, h->flags);
> -
> -     if (retval) {
> -             /*
> -              * Some (broken) implementations have a habit of returning
> -              * an error during things like firmware update etc.
> -              * But if the target only supports active/optimized there's
> -              * not much we can do; it's not that we can switch paths
> -              * or anything.
> -              * So ignore any errors to avoid spurious failures during
> -              * path failover.
> -              */
> -             if ((h->valid_states & ~TPGS_SUPPORT_OPTIMIZED) == 0) {
> -                     sdev_printk(KERN_INFO, sdev,
> -                                 "%s: ignoring rtpg result %d\n",
> -                                 ALUA_DH_NAME, retval);
> -                     kfree(buff);
> -                     return SCSI_DH_OK;
> -             }
> -             if (retval < 0 || !scsi_sense_valid(&sense_hdr)) {
> -                     sdev_printk(KERN_INFO, sdev,
> -                                 "%s: rtpg failed, result %d\n",
> -                                 ALUA_DH_NAME, retval);
> -                     kfree(buff);
> -                     if (retval < 0)
> -                             return SCSI_DH_DEV_TEMP_BUSY;
> -                     if (host_byte(retval) == DID_NO_CONNECT)
> -                             return SCSI_DH_RES_TEMP_UNAVAIL;
> -                     return SCSI_DH_IO;
> -             }
> -
> -             /*
> -              * submit_rtpg() has failed on existing arrays
> -              * when requesting extended header info, and
> -              * the array doesn't support extended headers,
> -              * even though it shouldn't according to T10.
> -              * The retry without rtpg_ext_hdr_req set
> -              * handles this.
> -              * Note:  some arrays return a sense key of ILLEGAL_REQUEST
> -              * with ASC 00h if they don't support the extended header.
> -              */
> -             if (!(h->flags & ALUA_RTPG_EXT_HDR_UNSUPP) &&
> -                 sense_hdr.sense_key == ILLEGAL_REQUEST) {
> -                     h->flags |= ALUA_RTPG_EXT_HDR_UNSUPP;
> -                     goto retry;
> -             }
> -             /*
> -              * If the array returns with 'ALUA state transition'
> -              * sense code here it cannot return RTPG data during
> -              * transition. So set the state to 'transitioning' directly.
> -              */
> -             if (sense_hdr.sense_key == NOT_READY &&
> -                 sense_hdr.asc == 0x04 && sense_hdr.ascq == 0x0a) {
> -                     transitioning_sense = true;
> -                     goto skip_rtpg;
> -             }
> -             /*
> -              * Retry on any other UNIT ATTENTION occurred.
> -              */
> -             if (sense_hdr.sense_key == UNIT_ATTENTION)
> -                     err = SCSI_DH_RETRY;
> -             if (err == SCSI_DH_RETRY &&
> -                 h->expiry != 0 && time_before(jiffies, h->expiry)) {
> -                     sdev_printk(KERN_ERR, sdev, "%s: rtpg retry\n",
> -                                 ALUA_DH_NAME);
> -                     scsi_print_sense_hdr(sdev, ALUA_DH_NAME, &sense_hdr);
> -                     kfree(buff);
> -                     return err;
> -             }
> -             sdev_printk(KERN_ERR, sdev, "%s: rtpg failed\n",
> -                         ALUA_DH_NAME);
> -             scsi_print_sense_hdr(sdev, ALUA_DH_NAME, &sense_hdr);
> -             kfree(buff);
> -             h->expiry = 0;
> -             return SCSI_DH_IO;
> -     }
> -
> -     len = get_unaligned_be32(&buff[0]) + 4;
> -
> -     if (len > bufflen) {
> -             /* Resubmit with the correct length */
> -             kfree(buff);
> -             bufflen = len;
> -             buff = kmalloc(bufflen, GFP_KERNEL);
> -             if (!buff) {
> -                     sdev_printk(KERN_WARNING, sdev,
> -                                 "%s: kmalloc buffer failed\n",__func__);
> -                     /* Temporary failure, bypass */
> -                     h->expiry = 0;
> -                     return SCSI_DH_DEV_TEMP_BUSY;
> -             }
> -             goto retry;
> -     }
> -
> -     orig_transition_tmo = h->transition_tmo;
> -     if ((buff[4] & RTPG_FMT_MASK) == RTPG_FMT_EXT_HDR && buff[5] != 0)
> -             h->transition_tmo = buff[5];
> -     else
> -             h->transition_tmo = ALUA_FAILOVER_TIMEOUT;
> -
> -     if (orig_transition_tmo != h->transition_tmo) {
> -             sdev_printk(KERN_INFO, sdev,
> -                         "%s: transition timeout set to %d seconds\n",
> -                         ALUA_DH_NAME, h->transition_tmo);
> -             h->expiry = jiffies + h->transition_tmo * HZ;
> -     }
> -
> -     if ((buff[4] & RTPG_FMT_MASK) == RTPG_FMT_EXT_HDR)
> -             tpg_desc_tbl_off = 8;
> -     else
> -             tpg_desc_tbl_off = 4;
> -
> -     for (k = tpg_desc_tbl_off, desc = buff + tpg_desc_tbl_off;
> -          k < len;
> -          k += off, desc += off) {
> -             u16 group_id_desc = get_unaligned_be16(&desc[2]);
> -
> -             spin_lock_irqsave(&h->lock, flags);
> -             if (group_id_desc == group_id) {
> -                     h->group_id = group_id;
> -                     WRITE_ONCE(h->state, desc[0] & 0x0f);
> -                     h->pref = desc[0] >> 7;
> -                     WRITE_ONCE(sdev->access_state, desc[0]);
> -                     h->valid_states = desc[1];
> -             }
> -             spin_unlock_irqrestore(&h->lock, flags);
> -             off = 8 + (desc[7] * 4);
> -     }
> -
> - skip_rtpg:
> -     spin_lock_irqsave(&h->lock, flags);
> -     if (transitioning_sense)
> -             h->state = SCSI_ACCESS_STATE_TRANSITIONING;
> -
> -     if (group_id_old != h->group_id || state_old != h->state ||
> -             pref_old != h->pref || valid_states_old != h->valid_states)
> -             sdev_printk(KERN_INFO, sdev,
> -                     "%s: port group %02x state %c %s supports 
> %c%c%c%c%c%c%c\n",
> -                     ALUA_DH_NAME, h->group_id, print_alua_state(h->state),
> -                     h->pref ? "preferred" : "non-preferred",
> -                     h->valid_states&TPGS_SUPPORT_TRANSITION?'T':'t',
> -                     h->valid_states&TPGS_SUPPORT_OFFLINE?'O':'o',
> -                     h->valid_states&TPGS_SUPPORT_LBA_DEPENDENT?'L':'l',
> -                     h->valid_states&TPGS_SUPPORT_UNAVAILABLE?'U':'u',
> -                     h->valid_states&TPGS_SUPPORT_STANDBY?'S':'s',
> -                     h->valid_states&TPGS_SUPPORT_NONOPTIMIZED?'N':'n',
> -                     h->valid_states&TPGS_SUPPORT_OPTIMIZED?'A':'a');
> -
> -     switch (h->state) {
> -     case SCSI_ACCESS_STATE_TRANSITIONING:
> -             if (time_before(jiffies, h->expiry)) {
> -                     /* State transition, retry */
> -                     h->interval = ALUA_RTPG_RETRY_DELAY;
> -                     err = SCSI_DH_RETRY;
> -             } else {
> -                     struct alua_dh_data *h;
> -                     unsigned char access_state;
> -
> -                     /* Transitioning time exceeded, set port to standby */
> -                     err = SCSI_DH_IO;
> -                     h->state = SCSI_ACCESS_STATE_STANDBY;
> -                     h->expiry = 0;
> -                     access_state = h->state & SCSI_ACCESS_STATE_MASK;
> -                     if (h->pref)
> -                             access_state |= SCSI_ACCESS_STATE_PREFERRED;
> -                     WRITE_ONCE(sdev->access_state, access_state);
> -             }
> -             break;
> -     case SCSI_ACCESS_STATE_OFFLINE:
> -             /* Path unusable */
> -             err = SCSI_DH_DEV_OFFLINED;
> -             h->expiry = 0;
> -             break;
> -     default:
> -             /* Useable path if active */
> -             err = SCSI_DH_OK;
> -             h->expiry = 0;
> -             break;
> -     }
> -     spin_unlock_irqrestore(&h->lock, flags);
> -     kfree(buff);
> -     return err;
> -}
> -
> -/*
> - * alua_stpg - Issue a SET TARGET PORT GROUP command
> - *
> - * Issue a SET TARGET PORT GROUP command and evaluate the
> - * response. Returns SCSI_DH_RETRY per default to trigger
> - * a re-evaluation of the target group state or SCSI_DH_OK
> - * if no further action needs to be taken.
> - */
> -static unsigned alua_stpg(struct scsi_device *sdev)
> -{
> -     int retval;
> -     struct scsi_sense_hdr sense_hdr;
> -     struct alua_dh_data *h = sdev->handler_data;
> -
> -     if (!(h->tpgs & TPGS_MODE_EXPLICIT)) {
> -             /* Only implicit ALUA supported, retry */
> -             return SCSI_DH_RETRY;
> -     }
> -     switch (h->state) {
> -     case SCSI_ACCESS_STATE_OPTIMAL:
> -             return SCSI_DH_OK;
> -     case SCSI_ACCESS_STATE_ACTIVE:
> -             if ((h->flags & ALUA_OPTIMIZE_STPG) &&
> -                 !h->pref &&
> -                 (h->tpgs & TPGS_MODE_IMPLICIT))
> -                     return SCSI_DH_OK;
> -             break;
> -     case SCSI_ACCESS_STATE_STANDBY:
> -     case SCSI_ACCESS_STATE_UNAVAILABLE:
> -             break;
> -     case SCSI_ACCESS_STATE_OFFLINE:
> -             return SCSI_DH_IO;
> -     case SCSI_ACCESS_STATE_TRANSITIONING:
> -             break;
> -     default:
> -             sdev_printk(KERN_INFO, sdev,
> -                         "%s: stpg failed, unhandled TPGS state %d",
> -                         ALUA_DH_NAME, h->state);
> -             return SCSI_DH_NOSYS;
> -     }
> -     retval = submit_stpg(sdev, h->group_id, &sense_hdr);
> -
> -     if (retval) {
> -             if (retval < 0 || !scsi_sense_valid(&sense_hdr)) {
> -                     sdev_printk(KERN_INFO, sdev,
> -                                 "%s: stpg failed, result %d",
> -                                 ALUA_DH_NAME, retval);
> -                     if (retval < 0)
> -                             return SCSI_DH_DEV_TEMP_BUSY;
> -             } else {
> -                     sdev_printk(KERN_INFO, sdev, "%s: stpg failed\n",
> -                                 ALUA_DH_NAME);
> -                     scsi_print_sense_hdr(sdev, ALUA_DH_NAME, &sense_hdr);
> -             }
> -     }
> -     /* Retry RTPG */
> -     return SCSI_DH_RETRY;
> -}
> -
>  static void alua_rtpg_work(struct work_struct *work)
>  {
>       struct alua_dh_data *h =
> @@ -670,56 +179,41 @@ static void alua_rtpg_work(struct work_struct *work)
>       int err = SCSI_DH_OK;
>       struct alua_queue_data *qdata, *tmp;
>       unsigned long flags;
> +     int ret;
>  
>       spin_lock_irqsave(&h->lock, flags);
>       h->flags |= ALUA_PG_RUNNING;
>       if (h->flags & ALUA_PG_RUN_RTPG) {
> -             int state = h->state;
>  
>               h->flags &= ~ALUA_PG_RUN_RTPG;
>               spin_unlock_irqrestore(&h->lock, flags);
> -             if (state == SCSI_ACCESS_STATE_TRANSITIONING) {
> -                     if (alua_tur(sdev) == SCSI_DH_RETRY) {
> -                             spin_lock_irqsave(&h->lock, flags);
> -                             h->flags &= ~ALUA_PG_RUNNING;
> -                             h->flags |= ALUA_PG_RUN_RTPG;
> -                             if (!h->interval)
> -                                     h->interval = ALUA_RTPG_RETRY_DELAY;
> -                             spin_unlock_irqrestore(&h->lock, flags);
> -                             queue_delayed_work(kaluad_wq, &h->rtpg_work,
> -                                                h->interval * HZ);
> -                             return;
> -                     }
> -                     /* Send RTPG on failure or if TUR indicates SUCCESS */
> -             }
> -             err = alua_rtpg(sdev);
> -             spin_lock_irqsave(&h->lock, flags);
> -
> -             if (err == SCSI_DH_RETRY || h->flags & ALUA_PG_RUN_RTPG) {
> +             ret = scsi_alua_rtpg_run(sdev);
> +             if (ret == -EAGAIN) {

This no longer handles the case where you want to trigger a new rtpg as
soon as the running one finishes. I think it should be checking
(ret == -EAGAIN || h->flags & ALUA_PG_RUN_RTPG)
with a spinlock held.

> +                     spin_lock_irqsave(&h->lock, flags);
>                       h->flags &= ~ALUA_PG_RUNNING;
> -                     if (err == SCSI_DH_IMM_RETRY)
> -                             h->interval = 0;
> -                     else if (!h->interval && !(h->flags & ALUA_PG_RUN_RTPG))
> -                             h->interval = ALUA_RTPG_RETRY_DELAY;
>                       h->flags |= ALUA_PG_RUN_RTPG;
>                       spin_unlock_irqrestore(&h->lock, flags);
> -                     goto queue_rtpg;
> +                     queue_delayed_work(kaluad_wq, &h->rtpg_work,
> +                                                        sdev->alua->interval 
> * HZ);
> +                     return;
>               }
> -             if (err != SCSI_DH_OK)
> -                     h->flags &= ~ALUA_PG_RUN_STPG;
> +             if (err != 0)
> +                             h->flags &= ~ALUA_PG_RUN_STPG;
>       }
> +     spin_lock_irqsave(&h->lock, flags);

If h->flags & ALUA_PG_RUN_RTPG is false above, h->lock will already be
locked.

>       if (h->flags & ALUA_PG_RUN_STPG) {
>               h->flags &= ~ALUA_PG_RUN_STPG;
>               spin_unlock_irqrestore(&h->lock, flags);
> -             err = alua_stpg(sdev);
> -             spin_lock_irqsave(&h->lock, flags);
> -             if (err == SCSI_DH_RETRY || h->flags & ALUA_PG_RUN_RTPG) {
> +             ret = scsi_alua_stpg_run(sdev, h->flags & ALUA_OPTIMIZE_STPG);
> +             if (err == -EAGAIN || h->flags & ALUA_PG_RUN_RTPG) {

To avoid a race with resetting ALUA_PG_RUN_RTPG, this check needs to be
done with the spinlock held.

-Ben

> +                     spin_lock_irqsave(&h->lock, flags);
>                       h->flags |= ALUA_PG_RUN_RTPG;
> -                     h->interval = 0;
>                       h->flags &= ~ALUA_PG_RUNNING;
>                       spin_unlock_irqrestore(&h->lock, flags);
>                       goto queue_rtpg;
>               }
> +     } else {
> +             spin_unlock_irqrestore(&h->lock, flags);
>       }
>  
>       list_splice_init(&h->rtpg_list, &qdata_list);
> @@ -728,8 +222,6 @@ static void alua_rtpg_work(struct work_struct *work)
>        * Re-enable the device for the next attempt.
>        */
>       h->disabled = false;
> -     spin_unlock_irqrestore(&h->lock, flags);
> -
>  
>       list_for_each_entry_safe(qdata, tmp, &qdata_list, entry) {
>               list_del(&qdata->entry);
> @@ -745,7 +237,7 @@ static void alua_rtpg_work(struct work_struct *work)
>       return;
>  
>  queue_rtpg:
> -     queue_delayed_work(kaluad_wq, &h->rtpg_work, h->interval * HZ);
> +     queue_delayed_work(kaluad_wq, &h->rtpg_work, sdev->alua->interval * HZ);
>  }
>  
>  /**
> @@ -809,7 +301,7 @@ static int alua_initialize(struct scsi_device *sdev, 
> struct alua_dh_data *h)
>  
>       mutex_lock(&h->init_mutex);
>       h->disabled = false;
> -     tpgs = alua_check_tpgs(sdev);
> +     tpgs = scsi_alua_check_tpgs(sdev);
>       if (tpgs != TPGS_MODE_NONE)
>               err = alua_check_vpd(sdev, h, tpgs);
>       h->init_error = err;
> @@ -898,34 +390,6 @@ static void alua_check(struct scsi_device *sdev, bool 
> force)
>       alua_rtpg_queue(sdev, NULL, force);
>  }
>  
> -/*
> - * alua_prep_fn - request callback
> - *
> - * Fail I/O to all paths not in state
> - * active/optimized or active/non-optimized.
> - */
> -static blk_status_t alua_prep_fn(struct scsi_device *sdev, struct request 
> *req)
> -{
> -     struct alua_dh_data *h = sdev->handler_data;
> -     unsigned long flags;
> -     unsigned char state;
> -
> -     spin_lock_irqsave(&h->lock, flags);
> -     state = h->state;
> -     spin_unlock_irqrestore(&h->lock, flags);
> -
> -     switch (state) {
> -     case SCSI_ACCESS_STATE_OPTIMAL:
> -     case SCSI_ACCESS_STATE_ACTIVE:
> -     case SCSI_ACCESS_STATE_LBA:
> -     case SCSI_ACCESS_STATE_TRANSITIONING:
> -             return BLK_STS_OK;
> -     default:
> -             req->rq_flags |= RQF_QUIET;
> -             return BLK_STS_IOERR;
> -     }
> -}
> -
>  static void alua_rescan(struct scsi_device *sdev)
>  {
>       struct alua_dh_data *h = sdev->handler_data;
> @@ -953,8 +417,6 @@ static int alua_bus_attach(struct scsi_device *sdev)
>  
>       mutex_init(&h->init_mutex);
>  
> -     h->state = SCSI_ACCESS_STATE_OPTIMAL;
> -     h->valid_states = TPGS_SUPPORT_ALL;
>       if (optimize_stpg)
>               h->flags |= ALUA_OPTIMIZE_STPG;
>  
> @@ -986,7 +448,7 @@ static struct scsi_device_handler alua_dh = {
>       .module = THIS_MODULE,
>       .attach = alua_bus_attach,
>       .detach = alua_bus_detach,
> -     .prep_fn = alua_prep_fn,
> +     .prep_fn = scsi_alua_prep_fn,
>       .check_sense = alua_check_sense,
>       .activate = alua_activate,
>       .rescan = alua_rescan,
> -- 
> 2.43.5


Reply via email to