* [patch 1/3 v4]raid1: make sequential read detection per disk based
@ 2012-07-05 9:20 Shaohua Li
2012-07-16 4:24 ` NeilBrown
0 siblings, 1 reply; 2+ messages in thread
From: Shaohua Li @ 2012-07-05 9:20 UTC (permalink / raw)
To: linux-raid; +Cc: neilb
Currently the sequential read detection is global wide. It's natural to make it
per disk based, which can improve the detection for concurrent multiple
sequential reads. And next patch will make SSD read balance not use distance
based algorithm, where this change help detect truly sequential read for SSD.
Signed-off-by: Shaohua Li <shli@fusionio.com>
---
drivers/md/raid1.c | 29 ++++++-----------------------
drivers/md/raid1.h | 11 +++++------
2 files changed, 11 insertions(+), 29 deletions(-)
Index: linux/drivers/md/raid1.c
===================================================================
--- linux.orig/drivers/md/raid1.c 2012-07-04 11:53:32.000000000 +0800
+++ linux/drivers/md/raid1.c 2012-07-04 15:23:51.114885573 +0800
@@ -483,7 +483,6 @@ static int read_balance(struct r1conf *c
const sector_t this_sector = r1_bio->sector;
int sectors;
int best_good_sectors;
- int start_disk;
int best_disk;
int i;
sector_t best_dist;
@@ -503,20 +502,17 @@ static int read_balance(struct r1conf *c
best_good_sectors = 0;
if (conf->mddev->recovery_cp < MaxSector &&
- (this_sector + sectors >= conf->next_resync)) {
+ (this_sector + sectors >= conf->next_resync))
choose_first = 1;
- start_disk = 0;
- } else {
+ else
choose_first = 0;
- start_disk = conf->last_used;
- }
for (i = 0 ; i < conf->raid_disks * 2 ; i++) {
sector_t dist;
sector_t first_bad;
int bad_sectors;
- int disk = start_disk + i;
+ int disk = i;
if (disk >= conf->raid_disks * 2)
disk -= conf->raid_disks * 2;
@@ -580,7 +576,7 @@ static int read_balance(struct r1conf *c
dist = abs(this_sector - conf->mirrors[disk].head_position);
if (choose_first
/* Don't change to another disk for sequential reads */
- || conf->next_seq_sect == this_sector
+ || conf->mirrors[disk].next_seq_sect == this_sector
|| dist == 0
/* If device is idle, use it */
|| atomic_read(&rdev->nr_pending) == 0) {
@@ -606,8 +602,7 @@ static int read_balance(struct r1conf *c
goto retry;
}
sectors = best_good_sectors;
- conf->next_seq_sect = this_sector + sectors;
- conf->last_used = best_disk;
+ conf->mirrors[best_disk].next_seq_sect = this_sector + sectors;
}
rcu_read_unlock();
*max_sectors = sectors;
@@ -2578,7 +2573,6 @@ static struct r1conf *setup_conf(struct
conf->recovery_disabled = mddev->recovery_disabled - 1;
err = -EIO;
- conf->last_used = -1;
for (i = 0; i < conf->raid_disks * 2; i++) {
disk = conf->mirrors + i;
@@ -2604,19 +2598,9 @@ static struct r1conf *setup_conf(struct
if (disk->rdev &&
(disk->rdev->saved_raid_disk < 0))
conf->fullsync = 1;
- } else if (conf->last_used < 0)
- /*
- * The first working device is used as a
- * starting point to read balancing.
- */
- conf->last_used = i;
+ }
}
- if (conf->last_used < 0) {
- printk(KERN_ERR "md/raid1:%s: no operational mirrors\n",
- mdname(mddev));
- goto abort;
- }
err = -ENOMEM;
conf->thread = md_register_thread(raid1d, mddev, "raid1");
if (!conf->thread) {
@@ -2873,7 +2857,6 @@ static int raid1_reshape(struct mddev *m
conf->raid_disks = mddev->raid_disks = raid_disks;
mddev->delta_disks = 0;
- conf->last_used = 0; /* just make sure it is in-range */
lower_barrier(conf);
set_bit(MD_RECOVERY_NEEDED, &mddev->recovery);
Index: linux/drivers/md/raid1.h
===================================================================
--- linux.orig/drivers/md/raid1.h 2012-07-02 09:19:11.000000000 +0800
+++ linux/drivers/md/raid1.h 2012-07-04 15:23:51.114885573 +0800
@@ -4,6 +4,11 @@
struct mirror_info {
struct md_rdev *rdev;
sector_t head_position;
+
+ /* When choose the best device for a read (read_balance())
+ * we try to keep sequential reads one the same device
+ */
+ sector_t next_seq_sect;
};
/*
@@ -29,12 +34,6 @@ struct r1conf {
*/
int raid_disks;
- /* When choose the best device for a read (read_balance())
- * we try to keep sequential reads one the same device
- * using 'last_used' and 'next_seq_sect'
- */
- int last_used;
- sector_t next_seq_sect;
/* During resync, read_balancing is only allowed on the part
* of the array that has been resynced. 'next_resync' tells us
* where that is.
^ permalink raw reply [flat|nested] 2+ messages in thread
* Re: [patch 1/3 v4]raid1: make sequential read detection per disk based
2012-07-05 9:20 [patch 1/3 v4]raid1: make sequential read detection per disk based Shaohua Li
@ 2012-07-16 4:24 ` NeilBrown
0 siblings, 0 replies; 2+ messages in thread
From: NeilBrown @ 2012-07-16 4:24 UTC (permalink / raw)
To: Shaohua Li; +Cc: linux-raid
[-- Attachment #1: Type: text/plain, Size: 1992 bytes --]
On Thu, 5 Jul 2012 17:20:31 +0800 Shaohua Li <shli@kernel.org> wrote:
> Currently the sequential read detection is global wide. It's natural to make it
> per disk based, which can improve the detection for concurrent multiple
> sequential reads. And next patch will make SSD read balance not use distance
> based algorithm, where this change help detect truly sequential read for SSD.
>
> Signed-off-by: Shaohua Li <shli@fusionio.com>
> ---
> drivers/md/raid1.c | 29 ++++++-----------------------
> drivers/md/raid1.h | 11 +++++------
> 2 files changed, 11 insertions(+), 29 deletions(-)
>
> Index: linux/drivers/md/raid1.c
> ===================================================================
> --- linux.orig/drivers/md/raid1.c 2012-07-04 11:53:32.000000000 +0800
> +++ linux/drivers/md/raid1.c 2012-07-04 15:23:51.114885573 +0800
> @@ -483,7 +483,6 @@ static int read_balance(struct r1conf *c
> const sector_t this_sector = r1_bio->sector;
> int sectors;
> int best_good_sectors;
> - int start_disk;
> int best_disk;
> int i;
> sector_t best_dist;
> @@ -503,20 +502,17 @@ static int read_balance(struct r1conf *c
> best_good_sectors = 0;
>
> if (conf->mddev->recovery_cp < MaxSector &&
> - (this_sector + sectors >= conf->next_resync)) {
> + (this_sector + sectors >= conf->next_resync))
> choose_first = 1;
> - start_disk = 0;
> - } else {
> + else
> choose_first = 0;
> - start_disk = conf->last_used;
> - }
>
> for (i = 0 ; i < conf->raid_disks * 2 ; i++) {
> sector_t dist;
> sector_t first_bad;
> int bad_sectors;
>
> - int disk = start_disk + i;
> + int disk = i;
> if (disk >= conf->raid_disks * 2)
> disk -= conf->raid_disks * 2;
You forgot the change I asked for here to make it
for (disk = 0; disk < ..... ; disk++)
but you've fixed up all the other bits nicely, so I made the above change and
have applied all three patches, thanks.
NeilBrown
[-- Attachment #2: signature.asc --]
[-- Type: application/pgp-signature, Size: 828 bytes --]
^ permalink raw reply [flat|nested] 2+ messages in thread
end of thread, other threads:[~2012-07-16 4:24 UTC | newest]
Thread overview: 2+ messages (download: mbox.gz follow: Atom feed
-- links below jump to the message on this page --
2012-07-05 9:20 [patch 1/3 v4]raid1: make sequential read detection per disk based Shaohua Li
2012-07-16 4:24 ` NeilBrown
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).