diff mbox series

scsi: pm80xx: Fix tmf task completion race condition

Message ID 20210707185945.35559-1-ipylypiv@google.com (mailing list archive)
State Accepted
Headers show
Series scsi: pm80xx: Fix tmf task completion race condition | expand

Commit Message

Igor Pylypiv July 7, 2021, 6:59 p.m. UTC
The TMF timeout timer may fire while the response from the controller
is still being handled. When this happens, the sas task may be freed
before the response processing has finished.

Fix this by having the timeout handler call complete() only when
SAS_TASK_STATE_DONE is not set, checking the flag under task_state_lock.

A similar race condition was fixed in commit b90cd6f2b905
("scsi: libsas: fix a race condition when smp task timeout")

Reviewed-by: Vishakha Channapattan <vishakhavc@google.com>
Signed-off-by: Igor Pylypiv <ipylypiv@google.com>
---
 drivers/scsi/pm8001/pm8001_sas.c | 32 +++++++++++++++-----------------
 1 file changed, 15 insertions(+), 17 deletions(-)

Comments

Martin K. Petersen July 27, 2021, 3:19 a.m. UTC | #1
Jack,

> The tmf timeout timer may trigger at the same time when the response
> from a controller is being handled. When this happens the sas task may
> get freed before the response processing is finished.
>
> Fix this by calling complete() only when SAS_TASK_STATE_DONE is not set.
>
> Similar race condition was fixed in commit b90cd6f2b905
> ("scsi: libsas: fix a race condition when smp task timeout")

Please review. Thanks!
Jinpu Wang July 27, 2021, 5:19 a.m. UTC | #2
On Wed, Jul 7, 2021 at 8:59 PM Igor Pylypiv <ipylypiv@google.com> wrote:
>
> The tmf timeout timer may trigger at the same time when the response
> from a controller is being handled. When this happens the sas task may
> get freed before the response processing is finished.
>
> Fix this by calling complete() only when SAS_TASK_STATE_DONE is not set.
>
> Similar race condition was fixed in commit b90cd6f2b905
> ("scsi: libsas: fix a race condition when smp task timeout")
>
> Reviewed-by: Vishakha Channapattan <vishakhavc@google.com>
> Signed-off-by: Igor Pylypiv <ipylypiv@google.com>

Looks good to me, thx, sorry for late reply, somehow I missed it.
Acked-by: Jack Wang <jinpu.wang@ionos.com>
>
> ---
>  drivers/scsi/pm8001/pm8001_sas.c | 32 +++++++++++++++-----------------
>  1 file changed, 15 insertions(+), 17 deletions(-)
>
> diff --git a/drivers/scsi/pm8001/pm8001_sas.c b/drivers/scsi/pm8001/pm8001_sas.c
> index 6f33d821e545..1d35587c28e0 100644
> --- a/drivers/scsi/pm8001/pm8001_sas.c
> +++ b/drivers/scsi/pm8001/pm8001_sas.c
> @@ -682,8 +682,7 @@ int pm8001_dev_found(struct domain_device *dev)
>
>  void pm8001_task_done(struct sas_task *task)
>  {
> -       if (!del_timer(&task->slow_task->timer))
> -               return;
> +       del_timer(&task->slow_task->timer);
>         complete(&task->slow_task->completion);
>  }
>
> @@ -691,9 +690,14 @@ static void pm8001_tmf_timedout(struct timer_list *t)
>  {
>         struct sas_task_slow *slow = from_timer(slow, t, timer);
>         struct sas_task *task = slow->task;
> +       unsigned long flags;
>
> -       task->task_state_flags |= SAS_TASK_STATE_ABORTED;
> -       complete(&task->slow_task->completion);
> +       spin_lock_irqsave(&task->task_state_lock, flags);
> +       if (!(task->task_state_flags & SAS_TASK_STATE_DONE)) {
> +               task->task_state_flags |= SAS_TASK_STATE_ABORTED;
> +               complete(&task->slow_task->completion);
> +       }
> +       spin_unlock_irqrestore(&task->task_state_lock, flags);
>  }
>
>  #define PM8001_TASK_TIMEOUT 20
> @@ -746,13 +750,10 @@ static int pm8001_exec_internal_tmf_task(struct domain_device *dev,
>                 }
>                 res = -TMF_RESP_FUNC_FAILED;
>                 /* Even TMF timed out, return direct. */
> -               if ((task->task_state_flags & SAS_TASK_STATE_ABORTED)) {
> -                       if (!(task->task_state_flags & SAS_TASK_STATE_DONE)) {
> -                               pm8001_dbg(pm8001_ha, FAIL,
> -                                          "TMF task[%x]timeout.\n",
> -                                          tmf->tmf);
> -                               goto ex_err;
> -                       }
> +               if (task->task_state_flags & SAS_TASK_STATE_ABORTED) {
> +                       pm8001_dbg(pm8001_ha, FAIL, "TMF task[%x]timeout.\n",
> +                                  tmf->tmf);
> +                       goto ex_err;
>                 }
>
>                 if (task->task_status.resp == SAS_TASK_COMPLETE &&
> @@ -832,12 +833,9 @@ pm8001_exec_internal_task_abort(struct pm8001_hba_info *pm8001_ha,
>                 wait_for_completion(&task->slow_task->completion);
>                 res = TMF_RESP_FUNC_FAILED;
>                 /* Even TMF timed out, return direct. */
> -               if ((task->task_state_flags & SAS_TASK_STATE_ABORTED)) {
> -                       if (!(task->task_state_flags & SAS_TASK_STATE_DONE)) {
> -                               pm8001_dbg(pm8001_ha, FAIL,
> -                                          "TMF task timeout.\n");
> -                               goto ex_err;
> -                       }
> +               if (task->task_state_flags & SAS_TASK_STATE_ABORTED) {
> +                       pm8001_dbg(pm8001_ha, FAIL, "TMF task timeout.\n");
> +                       goto ex_err;
>                 }
>
>                 if (task->task_status.resp == SAS_TASK_COMPLETE &&
> --
> 2.32.0.93.g670b81a890-goog
>
Jinpu Wang July 27, 2021, 5:20 a.m. UTC | #3
Hi Martin

On Tue, Jul 27, 2021 at 5:19 AM Martin K. Petersen
<martin.petersen@oracle.com> wrote:
>
>
> Jack,
>
> > The tmf timeout timer may trigger at the same time when the response
> > from a controller is being handled. When this happens the sas task may
> > get freed before the response processing is finished.
> >
> > Fix this by calling complete() only when SAS_TASK_STATE_DONE is not set.
> >
> > Similar race condition was fixed in commit b90cd6f2b905
> > ("scsi: libsas: fix a race condition when smp task timeout")
>
> Please review. Thanks!
Sorry for the late reply, done.
>
> --
> Martin K. Petersen      Oracle Linux Engineering
Martin K. Petersen July 29, 2021, 3:37 a.m. UTC | #4
On Wed, 7 Jul 2021 11:59:45 -0700, Igor Pylypiv wrote:

> The tmf timeout timer may trigger at the same time when the response
> from a controller is being handled. When this happens the sas task may
> get freed before the response processing is finished.
> 
> Fix this by calling complete() only when SAS_TASK_STATE_DONE is not set.
> 
> Similar race condition was fixed in commit b90cd6f2b905
> ("scsi: libsas: fix a race condition when smp task timeout")

Applied to 5.14/scsi-fixes, thanks!

[1/1] scsi: pm80xx: Fix tmf task completion race condition
      https://git.kernel.org/mkp/scsi/c/d712d3fb484b
diff mbox series

Patch

diff --git a/drivers/scsi/pm8001/pm8001_sas.c b/drivers/scsi/pm8001/pm8001_sas.c
index 6f33d821e545..1d35587c28e0 100644
--- a/drivers/scsi/pm8001/pm8001_sas.c
+++ b/drivers/scsi/pm8001/pm8001_sas.c
@@ -682,8 +682,7 @@  int pm8001_dev_found(struct domain_device *dev)
 
 void pm8001_task_done(struct sas_task *task)
 {
-	if (!del_timer(&task->slow_task->timer))
-		return;
+	del_timer(&task->slow_task->timer);
 	complete(&task->slow_task->completion);
 }
 
@@ -691,9 +690,14 @@  static void pm8001_tmf_timedout(struct timer_list *t)
 {
 	struct sas_task_slow *slow = from_timer(slow, t, timer);
 	struct sas_task *task = slow->task;
+	unsigned long flags;
 
-	task->task_state_flags |= SAS_TASK_STATE_ABORTED;
-	complete(&task->slow_task->completion);
+	spin_lock_irqsave(&task->task_state_lock, flags);
+	if (!(task->task_state_flags & SAS_TASK_STATE_DONE)) {
+		task->task_state_flags |= SAS_TASK_STATE_ABORTED;
+		complete(&task->slow_task->completion);
+	}
+	spin_unlock_irqrestore(&task->task_state_lock, flags);
 }
 
 #define PM8001_TASK_TIMEOUT 20
@@ -746,13 +750,10 @@  static int pm8001_exec_internal_tmf_task(struct domain_device *dev,
 		}
 		res = -TMF_RESP_FUNC_FAILED;
 		/* Even TMF timed out, return direct. */
-		if ((task->task_state_flags & SAS_TASK_STATE_ABORTED)) {
-			if (!(task->task_state_flags & SAS_TASK_STATE_DONE)) {
-				pm8001_dbg(pm8001_ha, FAIL,
-					   "TMF task[%x]timeout.\n",
-					   tmf->tmf);
-				goto ex_err;
-			}
+		if (task->task_state_flags & SAS_TASK_STATE_ABORTED) {
+			pm8001_dbg(pm8001_ha, FAIL, "TMF task[%x]timeout.\n",
+				   tmf->tmf);
+			goto ex_err;
 		}
 
 		if (task->task_status.resp == SAS_TASK_COMPLETE &&
@@ -832,12 +833,9 @@  pm8001_exec_internal_task_abort(struct pm8001_hba_info *pm8001_ha,
 		wait_for_completion(&task->slow_task->completion);
 		res = TMF_RESP_FUNC_FAILED;
 		/* Even TMF timed out, return direct. */
-		if ((task->task_state_flags & SAS_TASK_STATE_ABORTED)) {
-			if (!(task->task_state_flags & SAS_TASK_STATE_DONE)) {
-				pm8001_dbg(pm8001_ha, FAIL,
-					   "TMF task timeout.\n");
-				goto ex_err;
-			}
+		if (task->task_state_flags & SAS_TASK_STATE_ABORTED) {
+			pm8001_dbg(pm8001_ha, FAIL, "TMF task timeout.\n");
+			goto ex_err;
 		}
 
 		if (task->task_status.resp == SAS_TASK_COMPLETE &&