releases/4.9.179/md-raid-raid5-preserve-the-writeback-action-after-the-parity-check.patch - pub/scm/linux/kernel/git/stable/stable-queue - Git at Google

 From b2176a1dfb518d870ee073445d27055fea64dfb8 Mon Sep 17 00:00:00 2001
 From: Nigel Croxon <ncroxon@redhat.com>
 Date: Tue, 16 Apr 2019 09:50:09 -0700
 Subject: md/raid: raid5 preserve the writeback action after the parity check

 From: Nigel Croxon <ncroxon@redhat.com>

 commit b2176a1dfb518d870ee073445d27055fea64dfb8 upstream.

 The problem is that any 'uptodate' vs 'disks' check is not precise
 in this path. Put a "WARN_ON(!test_bit(R5_UPTODATE, &dev->flags))" on the
 device that might try to kick off writes and then skip the action.
 Better to prevent the raid driver from taking unexpected action *and* keep
 the system alive vs killing the machine with BUG_ON.

 Note: fixed warning reported by kbuild test robot <lkp@intel.com>

 Signed-off-by: Dan Williams <dan.j.williams@intel.com>
 Signed-off-by: Nigel Croxon <ncroxon@redhat.com>
 Signed-off-by: Song Liu <songliubraving@fb.com>
 Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>

 ---
  drivers/md/raid5.c |   10 +++++++++-
  1 file changed, 9 insertions(+), 1 deletion(-)

 --- a/drivers/md/raid5.c
 +++ b/drivers/md/raid5.c
 @@ -3878,7 +3878,7 @@ static void handle_parity_checks6(struct
  		/* now write out any block on a failed drive,
  		 * or P or Q if they were recomputed
  		 */
 -		BUG_ON(s->uptodate < disks - 1); /* We don't need Q to recover */
 +		dev = NULL;
  		if (s->failed == 2) {
  			dev = &sh->dev[s->failed_num[1]];
  			s->locked++;
 @@ -3903,6 +3903,14 @@ static void handle_parity_checks6(struct
  			set_bit(R5_LOCKED, &dev->flags);
  			set_bit(R5_Wantwrite, &dev->flags);
  		}
 +		if (WARN_ONCE(dev && !test_bit(R5_UPTODATE, &dev->flags),
 +			      "%s: disk%td not up to date\n",
 +			      mdname(conf->mddev),
 +			      dev - (struct r5dev *) &sh->dev)) {
 +			clear_bit(R5_LOCKED, &dev->flags);
 +			clear_bit(R5_Wantwrite, &dev->flags);
 +			s->locked--;
 +		}
  		clear_bit(STRIPE_DEGRADED, &sh->state);

  		set_bit(STRIPE_INSYNC, &sh->state);
	From b2176a1dfb518d870ee073445d27055fea64dfb8 Mon Sep 17 00:00:00 2001
	From: Nigel Croxon <ncroxon@redhat.com>
	Date: Tue, 16 Apr 2019 09:50:09 -0700
	Subject: md/raid: raid5 preserve the writeback action after the parity check

	From: Nigel Croxon <ncroxon@redhat.com>

	commit b2176a1dfb518d870ee073445d27055fea64dfb8 upstream.

	The problem is that any 'uptodate' vs 'disks' check is not precise
	in this path. Put a "WARN_ON(!test_bit(R5_UPTODATE, &dev->flags))" on the
	device that might try to kick off writes and then skip the action.
	Better to prevent the raid driver from taking unexpected action and keep
	the system alive vs killing the machine with BUG_ON.

	Note: fixed warning reported by kbuild test robot <lkp@intel.com>

	Signed-off-by: Dan Williams <dan.j.williams@intel.com>
	Signed-off-by: Nigel Croxon <ncroxon@redhat.com>
	Signed-off-by: Song Liu <songliubraving@fb.com>
	Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>

	---
	drivers/md/raid5.c | 10 +++++++++-
	1 file changed, 9 insertions(+), 1 deletion(-)

	--- a/drivers/md/raid5.c
	+++ b/drivers/md/raid5.c
	@@ -3878,7 +3878,7 @@ static void handle_parity_checks6(struct
	/* now write out any block on a failed drive,
	* or P or Q if they were recomputed
	*/
	- BUG_ON(s->uptodate < disks - 1); /* We don't need Q to recover */
	+ dev = NULL;
	if (s->failed == 2) {
	dev = &sh->dev[s->failed_num[1]];
	s->locked++;
	@@ -3903,6 +3903,14 @@ static void handle_parity_checks6(struct
	set_bit(R5_LOCKED, &dev->flags);
	set_bit(R5_Wantwrite, &dev->flags);
	}
	+ if (WARN_ONCE(dev && !test_bit(R5_UPTODATE, &dev->flags),
	+ "%s: disk%td not up to date\n",
	+ mdname(conf->mddev),
	+ dev - (struct r5dev *) &sh->dev)) {
	+ clear_bit(R5_LOCKED, &dev->flags);
	+ clear_bit(R5_Wantwrite, &dev->flags);
	+ s->locked--;
	+ }
	clear_bit(STRIPE_DEGRADED, &sh->state);

	set_bit(STRIPE_INSYNC, &sh->state);