scsi: lpfc: Abort outstanding ELS cmds when mailbox timeout error is detected

author Justin Tee <justin.tee@broadcom.com>

Wed, 12 Jul 2023 18:05:18 +0000 (11:05 -0700)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Sat, 23 Sep 2023 09:11:06 +0000 (11:11 +0200)
author Justin Tee <justin.tee@broadcom.com>
Wed, 12 Jul 2023 18:05:18 +0000 (11:05 -0700)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sat, 23 Sep 2023 09:11:06 +0000 (11:11 +0200)
diff --git a/drivers/scsi/lpfc/lpfc.h b/drivers/scsi/lpfc/lpfc.h

index 9ad233b40a9e2e660a82bd016b20f8be78ae5a6a..664ac3069c4bebe8a600d9d193ea30e17d4b383f 100644 (file)
--- a/drivers/scsi/lpfc/lpfc.h
+++ b/drivers/scsi/lpfc/lpfc.h
@@ -895,6 +895,7 @@ enum lpfc_irq_chann_mode {
  enum lpfc_hba_bit_flags {
         FABRIC_COMANDS_BLOCKED,
         HBA_PCI_ERR,
+       MBX_TMO_ERR,
  };
  
  struct lpfc_hba {
diff --git a/drivers/scsi/lpfc/lpfc_els.c b/drivers/scsi/lpfc/lpfc_els.c

index 43ebb41ded59360d43a5ca0edef669222182e8b8..6b5ce9869e6b4b5333b738330474a5ff2b377ab2 100644 (file)
--- a/drivers/scsi/lpfc/lpfc_els.c
+++ b/drivers/scsi/lpfc/lpfc_els.c
@@ -9410,11 +9410,13 @@ void
  lpfc_els_flush_cmd(struct lpfc_vport *vport)
  {
         LIST_HEAD(abort_list);
+       LIST_HEAD(cancel_list);
         struct lpfc_hba  *phba = vport->phba;
         struct lpfc_sli_ring *pring;
         struct lpfc_iocbq *tmp_iocb, *piocb;
         u32 ulp_command;
         unsigned long iflags = 0;
+       bool mbx_tmo_err;
  
         lpfc_fabric_abort_vport(vport);
  
@@ -9436,15 +9438,16 @@ lpfc_els_flush_cmd(struct lpfc_vport *vport)
         if (phba->sli_rev == LPFC_SLI_REV4)
                 spin_lock(&pring->ring_lock);
  
+       mbx_tmo_err = test_bit(MBX_TMO_ERR, &phba->bit_flags);
         /* First we need to issue aborts to outstanding cmds on txcmpl */
         list_for_each_entry_safe(piocb, tmp_iocb, &pring->txcmplq, list) {
-               if (piocb->cmd_flag & LPFC_IO_LIBDFC)
+               if (piocb->cmd_flag & LPFC_IO_LIBDFC && !mbx_tmo_err)
                         continue;
  
                 if (piocb->vport != vport)
                         continue;
  
-               if (piocb->cmd_flag & LPFC_DRIVER_ABORTED)
+               if (piocb->cmd_flag & LPFC_DRIVER_ABORTED && !mbx_tmo_err)
                         continue;
  
                 /* On the ELS ring we can have ELS_REQUESTs or
@@ -9463,8 +9466,8 @@ lpfc_els_flush_cmd(struct lpfc_vport *vport)
                          */
                         if (phba->link_state == LPFC_LINK_DOWN)
                                 piocb->cmd_cmpl = lpfc_cmpl_els_link_down;
-               }
-               if (ulp_command == CMD_GEN_REQUEST64_CR)
+               } else if (ulp_command == CMD_GEN_REQUEST64_CR ||
+                          mbx_tmo_err)
                         list_add_tail(&piocb->dlist, &abort_list);
         }
  
@@ -9476,11 +9479,19 @@ lpfc_els_flush_cmd(struct lpfc_vport *vport)
         list_for_each_entry_safe(piocb, tmp_iocb, &abort_list, dlist) {
                 spin_lock_irqsave(&phba->hbalock, iflags);
                 list_del_init(&piocb->dlist);
-               lpfc_sli_issue_abort_iotag(phba, pring, piocb, NULL);
+               if (mbx_tmo_err)
+                       list_move_tail(&piocb->list, &cancel_list);
+               else
+                       lpfc_sli_issue_abort_iotag(phba, pring, piocb, NULL);
+
                 spin_unlock_irqrestore(&phba->hbalock, iflags);
         }
-       /* Make sure HBA is alive */
-       lpfc_issue_hb_tmo(phba);
+       if (!list_empty(&cancel_list))
+               lpfc_sli_cancel_iocbs(phba, &cancel_list, IOSTAT_LOCAL_REJECT,
+                                     IOERR_SLI_ABORTED);
+       else
+               /* Make sure HBA is alive */
+               lpfc_issue_hb_tmo(phba);
  
         if (!list_empty(&abort_list))
                 lpfc_printf_vlog(vport, KERN_ERR, LOG_TRACE_EVENT,
diff --git a/drivers/scsi/lpfc/lpfc_init.c b/drivers/scsi/lpfc/lpfc_init.c

index d54fd153cb115cfdf8197195218b254bc71eb8fe..f59de61803dc820d3684b20f9856f377ebad2f21 100644 (file)
--- a/drivers/scsi/lpfc/lpfc_init.c
+++ b/drivers/scsi/lpfc/lpfc_init.c
@@ -7563,6 +7563,8 @@ lpfc_disable_pci_dev(struct lpfc_hba *phba)
  void
  lpfc_reset_hba(struct lpfc_hba *phba)
  {
+       int rc = 0;
+
         /* If resets are disabled then set error state and return. */
         if (!phba->cfg_enable_hba_reset) {
                 phba->link_state = LPFC_HBA_ERROR;
@@ -7573,13 +7575,25 @@ lpfc_reset_hba(struct lpfc_hba *phba)
         if (phba->sli.sli_flag & LPFC_SLI_ACTIVE) {
                 lpfc_offline_prep(phba, LPFC_MBX_WAIT);
         } else {
+               if (test_bit(MBX_TMO_ERR, &phba->bit_flags)) {
+                       /* Perform a PCI function reset to start from clean */
+                       rc = lpfc_pci_function_reset(phba);
+                       lpfc_els_flush_all_cmd(phba);
+               }
                 lpfc_offline_prep(phba, LPFC_MBX_NO_WAIT);
                 lpfc_sli_flush_io_rings(phba);
         }
         lpfc_offline(phba);
-       lpfc_sli_brdrestart(phba);
-       lpfc_online(phba);
-       lpfc_unblock_mgmt_io(phba);
+       clear_bit(MBX_TMO_ERR, &phba->bit_flags);
+       if (unlikely(rc)) {
+               lpfc_printf_log(phba, KERN_ERR, LOG_SLI,
+                               "8888 PCI function reset failed rc %x\n",
+                               rc);
+       } else {
+               lpfc_sli_brdrestart(phba);
+               lpfc_online(phba);
+               lpfc_unblock_mgmt_io(phba);
+       }
  }
  
  /**
diff --git a/drivers/scsi/lpfc/lpfc_sli.c b/drivers/scsi/lpfc/lpfc_sli.c

index b44bb3ae22ad9ed49da36d9cec42700ba4535267..427a6ac803e508c2b780221a633491a89962e3b7 100644 (file)
--- a/drivers/scsi/lpfc/lpfc_sli.c
+++ b/drivers/scsi/lpfc/lpfc_sli.c
@@ -3919,6 +3919,8 @@ void lpfc_poll_eratt(struct timer_list *t)
         uint64_t sli_intr, cnt;
  
         phba = from_timer(phba, t, eratt_poll);
+       if (!(phba->hba_flag & HBA_SETUP))
+               return;
  
         /* Here we will also keep track of interrupts per sec of the hba */
         sli_intr = phba->sli.slistat.sli_intr;
@@ -7712,7 +7714,9 @@ lpfc_sli4_repost_sgl_list(struct lpfc_hba *phba,
                 spin_unlock_irq(&phba->hbalock);
         } else {
                 lpfc_printf_log(phba, KERN_ERR, LOG_TRACE_EVENT,
-                               "3161 Failure to post sgl to port.\n");
+                               "3161 Failure to post sgl to port,status %x "
+                               "blkcnt %d totalcnt %d postcnt %d\n",
+                               status, block_cnt, total_cnt, post_cnt);
                 return -EIO;
         }
  
@@ -8495,6 +8499,7 @@ lpfc_sli4_hba_setup(struct lpfc_hba *phba)
                         spin_unlock_irq(&phba->hbalock);
                 }
         }
+       phba->hba_flag &= ~HBA_SETUP;
  
         lpfc_sli4_dip(phba);
  
@@ -9317,6 +9322,7 @@ lpfc_mbox_timeout_handler(struct lpfc_hba *phba)
          * would get IOCB_ERROR from lpfc_sli_issue_iocb, allowing
          * it to fail all outstanding SCSI IO.
          */
+       set_bit(MBX_TMO_ERR, &phba->bit_flags);
         spin_lock_irq(&phba->pport->work_port_lock);
         phba->pport->work_port_events &= ~WORKER_MBOX_TMO;
         spin_unlock_irq(&phba->pport->work_port_lock);
author	Justin Tee <justin.tee@broadcom.com>
	Wed, 12 Jul 2023 18:05:18 +0000 (11:05 -0700)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Sat, 23 Sep 2023 09:11:06 +0000 (11:11 +0200)
drivers/scsi/lpfc/lpfc.h		patch | blob | history
drivers/scsi/lpfc/lpfc_els.c		patch | blob | history
drivers/scsi/lpfc/lpfc_init.c		patch | blob | history
drivers/scsi/lpfc/lpfc_sli.c		patch | blob | history